From b9681557573b1d4f848c7b628521e8214a7a19bd Mon Sep 17 00:00:00 2001 From: Linxin Song Date: Wed, 30 Jul 2025 19:35:20 -0700 Subject: [PATCH] CoACT initialize (#292) --- desktop_env/controllers/python.py | 76 + desktop_env/server/main.py | 225 + mm_agents/coact/OAI_CONFIG_LIST | 27 + mm_agents/coact/__init__.py | 0 mm_agents/coact/autogen/__init__.py | 81 + mm_agents/coact/autogen/agentchat/__init__.py | 38 + mm_agents/coact/autogen/agentchat/agent.py | 182 + .../autogen/agentchat/assistant_agent.py | 85 + mm_agents/coact/autogen/agentchat/chat.py | 309 ++ .../autogen/agentchat/contrib/__init__.py | 5 + .../contrib/capabilities/__init__.py | 5 + .../contrib/capabilities/agent_capability.py | 20 + .../contrib/capabilities/generate_images.py | 301 ++ .../contrib/capabilities/teachability.py | 393 ++ .../contrib/capabilities/text_compressors.py | 66 + .../contrib/capabilities/tools_capability.py | 22 + .../capabilities/transform_messages.py | 93 + .../contrib/capabilities/transforms.py | 579 +++ .../contrib/capabilities/transforms_util.py | 122 + .../contrib/capabilities/vision_capability.py | 212 + .../autogen/agentchat/contrib/img_utils.py | 411 ++ .../contrib/multimodal_conversable_agent.py | 153 + .../autogen/agentchat/conversable_agent.py | 4023 +++++++++++++++++ .../coact/autogen/agentchat/group/__init__.py | 64 + .../agentchat/group/available_condition.py | 91 + .../agentchat/group/context_condition.py | 77 + .../agentchat/group/context_expression.py | 238 + .../autogen/agentchat/group/context_str.py | 41 + .../agentchat/group/context_variables.py | 192 + .../agentchat/group/group_tool_executor.py | 202 + .../autogen/agentchat/group/group_utils.py | 636 +++ .../coact/autogen/agentchat/group/handoffs.py | 320 ++ .../autogen/agentchat/group/llm_condition.py | 93 + .../agentchat/group/multi_agent_chat.py | 237 + .../autogen/agentchat/group/on_condition.py | 58 + .../agentchat/group/on_context_condition.py | 54 + .../agentchat/group/patterns/__init__.py | 18 + .../autogen/agentchat/group/patterns/auto.py | 159 + .../agentchat/group/patterns/manual.py | 176 + .../agentchat/group/patterns/pattern.py | 294 ++ .../agentchat/group/patterns/random.py | 106 + .../agentchat/group/patterns/round_robin.py | 117 + .../autogen/agentchat/group/reply_result.py | 26 + .../group/speaker_selection_result.py | 41 + .../agentchat/group/targets/__init__.py | 4 + .../group/targets/group_chat_target.py | 132 + .../group/targets/group_manager_target.py | 151 + .../group/targets/transition_target.py | 413 ++ .../group/targets/transition_utils.py | 6 + .../coact/autogen/agentchat/groupchat.py | 1694 +++++++ .../autogen/agentchat/realtime/__init__.py | 3 + .../realtime/experimental/__init__.py | 20 + .../experimental/audio_adapters/__init__.py | 8 + .../audio_adapters/twilio_audio_adapter.py | 148 + .../audio_adapters/websocket_audio_adapter.py | 139 + .../realtime/experimental/audio_observer.py | 42 + .../realtime/experimental/clients/__init__.py | 15 + .../experimental/clients/gemini/__init__.py | 7 + .../experimental/clients/gemini/client.py | 274 ++ .../experimental/clients/oai/__init__.py | 8 + .../experimental/clients/oai/base_client.py | 220 + .../experimental/clients/oai/rtc_client.py | 243 + .../experimental/clients/oai/utils.py | 48 + .../experimental/clients/realtime_client.py | 190 + .../experimental/function_observer.py | 85 + .../realtime/experimental/realtime_agent.py | 158 + .../realtime/experimental/realtime_events.py | 42 + .../experimental/realtime_observer.py | 100 + 
.../realtime/experimental/realtime_swarm.py | 483 ++ .../realtime/experimental/websockets.py | 21 + .../agentchat/realtime_agent/__init__.py | 21 + .../autogen/agentchat/user_proxy_agent.py | 111 + mm_agents/coact/autogen/agentchat/utils.py | 206 + mm_agents/coact/autogen/code_utils.py | 596 +++ mm_agents/coact/autogen/coding/__init__.py | 22 + mm_agents/coact/autogen/coding/base.py | 119 + .../docker_commandline_code_executor.py | 268 ++ mm_agents/coact/autogen/coding/factory.py | 47 + .../coact/autogen/coding/func_with_reqs.py | 202 + .../coact/autogen/coding/jupyter/__init__.py | 23 + .../coact/autogen/coding/jupyter/base.py | 36 + .../coding/jupyter/docker_jupyter_server.py | 167 + .../jupyter/embedded_ipython_code_executor.py | 182 + .../autogen/coding/jupyter/import_utils.py | 82 + .../autogen/coding/jupyter/jupyter_client.py | 231 + .../coding/jupyter/jupyter_code_executor.py | 160 + .../coding/jupyter/local_jupyter_server.py | 172 + .../coding/local_commandline_code_executor.py | 405 ++ .../autogen/coding/markdown_code_extractor.py | 45 + mm_agents/coact/autogen/coding/utils.py | 56 + mm_agents/coact/autogen/doc_utils.py | 34 + mm_agents/coact/autogen/events/__init__.py | 7 + .../coact/autogen/events/agent_events.py | 1014 +++++ mm_agents/coact/autogen/events/base_event.py | 99 + .../coact/autogen/events/client_events.py | 167 + mm_agents/coact/autogen/events/helpers.py | 36 + mm_agents/coact/autogen/events/print_event.py | 46 + mm_agents/coact/autogen/exception_utils.py | 73 + .../coact/autogen/fast_depends/__init__.py | 16 + .../coact/autogen/fast_depends/_compat.py | 80 + .../autogen/fast_depends/core/__init__.py | 14 + .../coact/autogen/fast_depends/core/build.py | 225 + .../coact/autogen/fast_depends/core/model.py | 576 +++ .../fast_depends/dependencies/__init__.py | 15 + .../fast_depends/dependencies/model.py | 29 + .../fast_depends/dependencies/provider.py | 39 + .../autogen/fast_depends/library/__init__.py | 10 + .../autogen/fast_depends/library/model.py | 46 + mm_agents/coact/autogen/fast_depends/py.typed | 6 + .../coact/autogen/fast_depends/schema.py | 66 + mm_agents/coact/autogen/fast_depends/use.py | 280 ++ mm_agents/coact/autogen/fast_depends/utils.py | 187 + mm_agents/coact/autogen/formatting_utils.py | 83 + mm_agents/coact/autogen/function_utils.py | 13 + mm_agents/coact/autogen/graph_utils.py | 178 + mm_agents/coact/autogen/import_utils.py | 526 +++ mm_agents/coact/autogen/interop/__init__.py | 22 + .../coact/autogen/interop/crewai/__init__.py | 7 + .../coact/autogen/interop/crewai/crewai.py | 88 + .../coact/autogen/interop/interoperability.py | 71 + .../coact/autogen/interop/interoperable.py | 46 + .../autogen/interop/langchain/__init__.py | 8 + .../langchain/langchain_chat_model_factory.py | 155 + .../interop/langchain/langchain_tool.py | 82 + .../coact/autogen/interop/litellm/__init__.py | 7 + .../interop/litellm/litellm_config_factory.py | 179 + .../autogen/interop/pydantic_ai/__init__.py | 7 + .../interop/pydantic_ai/pydantic_ai.py | 168 + mm_agents/coact/autogen/interop/registry.py | 69 + mm_agents/coact/autogen/io/__init__.py | 15 + mm_agents/coact/autogen/io/base.py | 151 + mm_agents/coact/autogen/io/console.py | 56 + .../coact/autogen/io/processors/__init__.py | 12 + mm_agents/coact/autogen/io/processors/base.py | 21 + .../io/processors/console_event_processor.py | 56 + mm_agents/coact/autogen/io/run_response.py | 293 ++ .../coact/autogen/io/thread_io_stream.py | 63 + mm_agents/coact/autogen/io/websockets.py | 213 + mm_agents/coact/autogen/json_utils.py | 
43 + mm_agents/coact/autogen/llm_config.py | 382 ++ mm_agents/coact/autogen/logger/__init__.py | 11 + mm_agents/coact/autogen/logger/base_logger.py | 128 + mm_agents/coact/autogen/logger/file_logger.py | 261 ++ .../coact/autogen/logger/logger_factory.py | 42 + .../coact/autogen/logger/logger_utils.py | 57 + .../coact/autogen/logger/sqlite_logger.py | 523 +++ mm_agents/coact/autogen/messages/__init__.py | 7 + .../coact/autogen/messages/agent_messages.py | 948 ++++ .../coact/autogen/messages/base_message.py | 107 + .../coact/autogen/messages/client_messages.py | 171 + .../coact/autogen/messages/print_message.py | 49 + mm_agents/coact/autogen/oai/__init__.py | 53 + mm_agents/coact/autogen/oai/anthropic.py | 714 +++ mm_agents/coact/autogen/oai/bedrock.py | 628 +++ mm_agents/coact/autogen/oai/cerebras.py | 299 ++ mm_agents/coact/autogen/oai/client.py | 1444 ++++++ mm_agents/coact/autogen/oai/client_utils.py | 169 + mm_agents/coact/autogen/oai/cohere.py | 479 ++ mm_agents/coact/autogen/oai/gemini.py | 1007 +++++ mm_agents/coact/autogen/oai/gemini_types.py | 156 + mm_agents/coact/autogen/oai/groq.py | 305 ++ mm_agents/coact/autogen/oai/mistral.py | 303 ++ .../coact/autogen/oai/oai_models/__init__.py | 11 + .../coact/autogen/oai/oai_models/_models.py | 16 + .../autogen/oai/oai_models/chat_completion.py | 87 + .../oai/oai_models/chat_completion_audio.py | 32 + .../oai/oai_models/chat_completion_message.py | 86 + .../chat_completion_message_tool_call.py | 37 + .../chat_completion_token_logprob.py | 63 + .../oai/oai_models/completion_usage.py | 60 + mm_agents/coact/autogen/oai/ollama.py | 643 +++ mm_agents/coact/autogen/oai/openai_utils.py | 881 ++++ mm_agents/coact/autogen/oai/together.py | 370 ++ mm_agents/coact/autogen/retrieve_utils.py | 491 ++ mm_agents/coact/autogen/runtime_logging.py | 160 + mm_agents/coact/autogen/token_count_utils.py | 265 ++ mm_agents/coact/autogen/tools/__init__.py | 20 + .../coact/autogen/tools/contrib/__init__.py | 9 + .../autogen/tools/contrib/time/__init__.py | 7 + .../coact/autogen/tools/contrib/time/time.py | 41 + .../autogen/tools/dependency_injection.py | 254 ++ .../autogen/tools/experimental/__init__.py | 48 + .../experimental/browser_use/__init__.py | 7 + .../experimental/browser_use/browser_use.py | 161 + .../tools/experimental/crawl4ai/__init__.py | 7 + .../tools/experimental/crawl4ai/crawl4ai.py | 153 + .../experimental/deep_research/__init__.py | 7 + .../deep_research/deep_research.py | 328 ++ .../tools/experimental/duckduckgo/__init__.py | 7 + .../duckduckgo/duckduckgo_search.py | 109 + .../tools/experimental/google/__init__.py | 14 + .../google/authentication/__init__.py | 11 + .../credentials_hosted_provider.py | 43 + .../credentials_local_provider.py | 91 + .../authentication/credentials_provider.py | 35 + .../experimental/google/drive/__init__.py | 9 + .../google/drive/drive_functions.py | 124 + .../experimental/google/drive/toolkit.py | 88 + .../tools/experimental/google/model.py | 17 + .../experimental/google/toolkit_protocol.py | 19 + .../experimental/google_search/__init__.py | 8 + .../google_search/google_search.py | 93 + .../google_search/youtube_search.py | 181 + .../experimental/messageplatform/__init__.py | 17 + .../messageplatform/discord/__init__.py | 7 + .../messageplatform/discord/discord.py | 288 ++ .../messageplatform/slack/__init__.py | 7 + .../messageplatform/slack/slack.py | 391 ++ .../messageplatform/telegram/__init__.py | 7 + .../messageplatform/telegram/telegram.py | 275 ++ .../tools/experimental/perplexity/__init__.py | 7 + 
.../perplexity/perplexity_search.py | 260 ++ .../tools/experimental/reliable/__init__.py | 10 + .../tools/experimental/reliable/reliable.py | 1316 ++++++ .../tools/experimental/tavily/__init__.py | 7 + .../experimental/tavily/tavily_search.py | 183 + .../web_search_preview/__init__.py | 7 + .../web_search_preview/web_search_preview.py | 114 + .../tools/experimental/wikipedia/__init__.py | 7 + .../tools/experimental/wikipedia/wikipedia.py | 287 ++ .../coact/autogen/tools/function_utils.py | 411 ++ mm_agents/coact/autogen/tools/tool.py | 187 + mm_agents/coact/autogen/tools/toolkit.py | 86 + mm_agents/coact/autogen/types.py | 29 + mm_agents/coact/coding_agent.py | 78 + mm_agents/coact/cua_agent.py | 328 ++ mm_agents/coact/operator_agent.py | 305 ++ run_coact.py | 266 ++ 228 files changed, 42386 insertions(+) create mode 100644 mm_agents/coact/OAI_CONFIG_LIST create mode 100644 mm_agents/coact/__init__.py create mode 100644 mm_agents/coact/autogen/__init__.py create mode 100644 mm_agents/coact/autogen/agentchat/__init__.py create mode 100644 mm_agents/coact/autogen/agentchat/agent.py create mode 100644 mm_agents/coact/autogen/agentchat/assistant_agent.py create mode 100644 mm_agents/coact/autogen/agentchat/chat.py create mode 100644 mm_agents/coact/autogen/agentchat/contrib/__init__.py create mode 100644 mm_agents/coact/autogen/agentchat/contrib/capabilities/__init__.py create mode 100644 mm_agents/coact/autogen/agentchat/contrib/capabilities/agent_capability.py create mode 100644 mm_agents/coact/autogen/agentchat/contrib/capabilities/generate_images.py create mode 100644 mm_agents/coact/autogen/agentchat/contrib/capabilities/teachability.py create mode 100644 mm_agents/coact/autogen/agentchat/contrib/capabilities/text_compressors.py create mode 100644 mm_agents/coact/autogen/agentchat/contrib/capabilities/tools_capability.py create mode 100644 mm_agents/coact/autogen/agentchat/contrib/capabilities/transform_messages.py create mode 100644 mm_agents/coact/autogen/agentchat/contrib/capabilities/transforms.py create mode 100644 mm_agents/coact/autogen/agentchat/contrib/capabilities/transforms_util.py create mode 100644 mm_agents/coact/autogen/agentchat/contrib/capabilities/vision_capability.py create mode 100644 mm_agents/coact/autogen/agentchat/contrib/img_utils.py create mode 100644 mm_agents/coact/autogen/agentchat/contrib/multimodal_conversable_agent.py create mode 100644 mm_agents/coact/autogen/agentchat/conversable_agent.py create mode 100644 mm_agents/coact/autogen/agentchat/group/__init__.py create mode 100644 mm_agents/coact/autogen/agentchat/group/available_condition.py create mode 100644 mm_agents/coact/autogen/agentchat/group/context_condition.py create mode 100644 mm_agents/coact/autogen/agentchat/group/context_expression.py create mode 100644 mm_agents/coact/autogen/agentchat/group/context_str.py create mode 100644 mm_agents/coact/autogen/agentchat/group/context_variables.py create mode 100644 mm_agents/coact/autogen/agentchat/group/group_tool_executor.py create mode 100644 mm_agents/coact/autogen/agentchat/group/group_utils.py create mode 100644 mm_agents/coact/autogen/agentchat/group/handoffs.py create mode 100644 mm_agents/coact/autogen/agentchat/group/llm_condition.py create mode 100644 mm_agents/coact/autogen/agentchat/group/multi_agent_chat.py create mode 100644 mm_agents/coact/autogen/agentchat/group/on_condition.py create mode 100644 mm_agents/coact/autogen/agentchat/group/on_context_condition.py create mode 100644 mm_agents/coact/autogen/agentchat/group/patterns/__init__.py 
create mode 100644 mm_agents/coact/autogen/agentchat/group/patterns/auto.py create mode 100644 mm_agents/coact/autogen/agentchat/group/patterns/manual.py create mode 100644 mm_agents/coact/autogen/agentchat/group/patterns/pattern.py create mode 100644 mm_agents/coact/autogen/agentchat/group/patterns/random.py create mode 100644 mm_agents/coact/autogen/agentchat/group/patterns/round_robin.py create mode 100644 mm_agents/coact/autogen/agentchat/group/reply_result.py create mode 100644 mm_agents/coact/autogen/agentchat/group/speaker_selection_result.py create mode 100644 mm_agents/coact/autogen/agentchat/group/targets/__init__.py create mode 100644 mm_agents/coact/autogen/agentchat/group/targets/group_chat_target.py create mode 100644 mm_agents/coact/autogen/agentchat/group/targets/group_manager_target.py create mode 100644 mm_agents/coact/autogen/agentchat/group/targets/transition_target.py create mode 100644 mm_agents/coact/autogen/agentchat/group/targets/transition_utils.py create mode 100644 mm_agents/coact/autogen/agentchat/groupchat.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/__init__.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/__init__.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/audio_adapters/__init__.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/audio_adapters/twilio_audio_adapter.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/audio_adapters/websocket_audio_adapter.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/audio_observer.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/clients/__init__.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/clients/gemini/__init__.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/clients/gemini/client.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/__init__.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/base_client.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/rtc_client.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/utils.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/clients/realtime_client.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/function_observer.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_agent.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_events.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_observer.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_swarm.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime/experimental/websockets.py create mode 100644 mm_agents/coact/autogen/agentchat/realtime_agent/__init__.py create mode 100644 mm_agents/coact/autogen/agentchat/user_proxy_agent.py create mode 100644 mm_agents/coact/autogen/agentchat/utils.py create mode 100644 mm_agents/coact/autogen/code_utils.py create mode 100644 mm_agents/coact/autogen/coding/__init__.py create mode 100644 mm_agents/coact/autogen/coding/base.py create mode 100644 mm_agents/coact/autogen/coding/docker_commandline_code_executor.py create mode 100644 mm_agents/coact/autogen/coding/factory.py create mode 
100644 mm_agents/coact/autogen/coding/func_with_reqs.py create mode 100644 mm_agents/coact/autogen/coding/jupyter/__init__.py create mode 100644 mm_agents/coact/autogen/coding/jupyter/base.py create mode 100644 mm_agents/coact/autogen/coding/jupyter/docker_jupyter_server.py create mode 100644 mm_agents/coact/autogen/coding/jupyter/embedded_ipython_code_executor.py create mode 100644 mm_agents/coact/autogen/coding/jupyter/import_utils.py create mode 100644 mm_agents/coact/autogen/coding/jupyter/jupyter_client.py create mode 100644 mm_agents/coact/autogen/coding/jupyter/jupyter_code_executor.py create mode 100644 mm_agents/coact/autogen/coding/jupyter/local_jupyter_server.py create mode 100644 mm_agents/coact/autogen/coding/local_commandline_code_executor.py create mode 100644 mm_agents/coact/autogen/coding/markdown_code_extractor.py create mode 100644 mm_agents/coact/autogen/coding/utils.py create mode 100644 mm_agents/coact/autogen/doc_utils.py create mode 100644 mm_agents/coact/autogen/events/__init__.py create mode 100644 mm_agents/coact/autogen/events/agent_events.py create mode 100644 mm_agents/coact/autogen/events/base_event.py create mode 100644 mm_agents/coact/autogen/events/client_events.py create mode 100644 mm_agents/coact/autogen/events/helpers.py create mode 100644 mm_agents/coact/autogen/events/print_event.py create mode 100644 mm_agents/coact/autogen/exception_utils.py create mode 100644 mm_agents/coact/autogen/fast_depends/__init__.py create mode 100644 mm_agents/coact/autogen/fast_depends/_compat.py create mode 100644 mm_agents/coact/autogen/fast_depends/core/__init__.py create mode 100644 mm_agents/coact/autogen/fast_depends/core/build.py create mode 100644 mm_agents/coact/autogen/fast_depends/core/model.py create mode 100644 mm_agents/coact/autogen/fast_depends/dependencies/__init__.py create mode 100644 mm_agents/coact/autogen/fast_depends/dependencies/model.py create mode 100644 mm_agents/coact/autogen/fast_depends/dependencies/provider.py create mode 100644 mm_agents/coact/autogen/fast_depends/library/__init__.py create mode 100644 mm_agents/coact/autogen/fast_depends/library/model.py create mode 100644 mm_agents/coact/autogen/fast_depends/py.typed create mode 100644 mm_agents/coact/autogen/fast_depends/schema.py create mode 100644 mm_agents/coact/autogen/fast_depends/use.py create mode 100644 mm_agents/coact/autogen/fast_depends/utils.py create mode 100644 mm_agents/coact/autogen/formatting_utils.py create mode 100644 mm_agents/coact/autogen/function_utils.py create mode 100644 mm_agents/coact/autogen/graph_utils.py create mode 100644 mm_agents/coact/autogen/import_utils.py create mode 100644 mm_agents/coact/autogen/interop/__init__.py create mode 100644 mm_agents/coact/autogen/interop/crewai/__init__.py create mode 100644 mm_agents/coact/autogen/interop/crewai/crewai.py create mode 100644 mm_agents/coact/autogen/interop/interoperability.py create mode 100644 mm_agents/coact/autogen/interop/interoperable.py create mode 100644 mm_agents/coact/autogen/interop/langchain/__init__.py create mode 100644 mm_agents/coact/autogen/interop/langchain/langchain_chat_model_factory.py create mode 100644 mm_agents/coact/autogen/interop/langchain/langchain_tool.py create mode 100644 mm_agents/coact/autogen/interop/litellm/__init__.py create mode 100644 mm_agents/coact/autogen/interop/litellm/litellm_config_factory.py create mode 100644 mm_agents/coact/autogen/interop/pydantic_ai/__init__.py create mode 100644 mm_agents/coact/autogen/interop/pydantic_ai/pydantic_ai.py create mode 
100644 mm_agents/coact/autogen/interop/registry.py create mode 100644 mm_agents/coact/autogen/io/__init__.py create mode 100644 mm_agents/coact/autogen/io/base.py create mode 100644 mm_agents/coact/autogen/io/console.py create mode 100644 mm_agents/coact/autogen/io/processors/__init__.py create mode 100644 mm_agents/coact/autogen/io/processors/base.py create mode 100644 mm_agents/coact/autogen/io/processors/console_event_processor.py create mode 100644 mm_agents/coact/autogen/io/run_response.py create mode 100644 mm_agents/coact/autogen/io/thread_io_stream.py create mode 100644 mm_agents/coact/autogen/io/websockets.py create mode 100644 mm_agents/coact/autogen/json_utils.py create mode 100644 mm_agents/coact/autogen/llm_config.py create mode 100644 mm_agents/coact/autogen/logger/__init__.py create mode 100644 mm_agents/coact/autogen/logger/base_logger.py create mode 100644 mm_agents/coact/autogen/logger/file_logger.py create mode 100644 mm_agents/coact/autogen/logger/logger_factory.py create mode 100644 mm_agents/coact/autogen/logger/logger_utils.py create mode 100644 mm_agents/coact/autogen/logger/sqlite_logger.py create mode 100644 mm_agents/coact/autogen/messages/__init__.py create mode 100644 mm_agents/coact/autogen/messages/agent_messages.py create mode 100644 mm_agents/coact/autogen/messages/base_message.py create mode 100644 mm_agents/coact/autogen/messages/client_messages.py create mode 100644 mm_agents/coact/autogen/messages/print_message.py create mode 100644 mm_agents/coact/autogen/oai/__init__.py create mode 100644 mm_agents/coact/autogen/oai/anthropic.py create mode 100644 mm_agents/coact/autogen/oai/bedrock.py create mode 100644 mm_agents/coact/autogen/oai/cerebras.py create mode 100644 mm_agents/coact/autogen/oai/client.py create mode 100644 mm_agents/coact/autogen/oai/client_utils.py create mode 100644 mm_agents/coact/autogen/oai/cohere.py create mode 100644 mm_agents/coact/autogen/oai/gemini.py create mode 100644 mm_agents/coact/autogen/oai/gemini_types.py create mode 100644 mm_agents/coact/autogen/oai/groq.py create mode 100644 mm_agents/coact/autogen/oai/mistral.py create mode 100644 mm_agents/coact/autogen/oai/oai_models/__init__.py create mode 100644 mm_agents/coact/autogen/oai/oai_models/_models.py create mode 100644 mm_agents/coact/autogen/oai/oai_models/chat_completion.py create mode 100644 mm_agents/coact/autogen/oai/oai_models/chat_completion_audio.py create mode 100644 mm_agents/coact/autogen/oai/oai_models/chat_completion_message.py create mode 100644 mm_agents/coact/autogen/oai/oai_models/chat_completion_message_tool_call.py create mode 100644 mm_agents/coact/autogen/oai/oai_models/chat_completion_token_logprob.py create mode 100644 mm_agents/coact/autogen/oai/oai_models/completion_usage.py create mode 100644 mm_agents/coact/autogen/oai/ollama.py create mode 100644 mm_agents/coact/autogen/oai/openai_utils.py create mode 100644 mm_agents/coact/autogen/oai/together.py create mode 100644 mm_agents/coact/autogen/retrieve_utils.py create mode 100644 mm_agents/coact/autogen/runtime_logging.py create mode 100644 mm_agents/coact/autogen/token_count_utils.py create mode 100644 mm_agents/coact/autogen/tools/__init__.py create mode 100644 mm_agents/coact/autogen/tools/contrib/__init__.py create mode 100644 mm_agents/coact/autogen/tools/contrib/time/__init__.py create mode 100644 mm_agents/coact/autogen/tools/contrib/time/time.py create mode 100644 mm_agents/coact/autogen/tools/dependency_injection.py create mode 100644 
mm_agents/coact/autogen/tools/experimental/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/browser_use/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/browser_use/browser_use.py create mode 100644 mm_agents/coact/autogen/tools/experimental/crawl4ai/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/crawl4ai/crawl4ai.py create mode 100644 mm_agents/coact/autogen/tools/experimental/deep_research/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/deep_research/deep_research.py create mode 100644 mm_agents/coact/autogen/tools/experimental/duckduckgo/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/duckduckgo/duckduckgo_search.py create mode 100644 mm_agents/coact/autogen/tools/experimental/google/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/google/authentication/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/google/authentication/credentials_hosted_provider.py create mode 100644 mm_agents/coact/autogen/tools/experimental/google/authentication/credentials_local_provider.py create mode 100644 mm_agents/coact/autogen/tools/experimental/google/authentication/credentials_provider.py create mode 100644 mm_agents/coact/autogen/tools/experimental/google/drive/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/google/drive/drive_functions.py create mode 100644 mm_agents/coact/autogen/tools/experimental/google/drive/toolkit.py create mode 100644 mm_agents/coact/autogen/tools/experimental/google/model.py create mode 100644 mm_agents/coact/autogen/tools/experimental/google/toolkit_protocol.py create mode 100644 mm_agents/coact/autogen/tools/experimental/google_search/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/google_search/google_search.py create mode 100644 mm_agents/coact/autogen/tools/experimental/google_search/youtube_search.py create mode 100644 mm_agents/coact/autogen/tools/experimental/messageplatform/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/messageplatform/discord/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/messageplatform/discord/discord.py create mode 100644 mm_agents/coact/autogen/tools/experimental/messageplatform/slack/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/messageplatform/slack/slack.py create mode 100644 mm_agents/coact/autogen/tools/experimental/messageplatform/telegram/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/messageplatform/telegram/telegram.py create mode 100644 mm_agents/coact/autogen/tools/experimental/perplexity/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/perplexity/perplexity_search.py create mode 100644 mm_agents/coact/autogen/tools/experimental/reliable/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/reliable/reliable.py create mode 100644 mm_agents/coact/autogen/tools/experimental/tavily/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/tavily/tavily_search.py create mode 100644 mm_agents/coact/autogen/tools/experimental/web_search_preview/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/web_search_preview/web_search_preview.py create mode 100644 mm_agents/coact/autogen/tools/experimental/wikipedia/__init__.py create mode 100644 mm_agents/coact/autogen/tools/experimental/wikipedia/wikipedia.py create mode 100644 
mm_agents/coact/autogen/tools/function_utils.py create mode 100644 mm_agents/coact/autogen/tools/tool.py create mode 100644 mm_agents/coact/autogen/tools/toolkit.py create mode 100644 mm_agents/coact/autogen/types.py create mode 100644 mm_agents/coact/coding_agent.py create mode 100644 mm_agents/coact/cua_agent.py create mode 100644 mm_agents/coact/operator_agent.py create mode 100644 run_coact.py diff --git a/desktop_env/controllers/python.py b/desktop_env/controllers/python.py index c572083..743dd09 100644 --- a/desktop_env/controllers/python.py +++ b/desktop_env/controllers/python.py @@ -136,6 +136,82 @@ class PythonController: logger.error("Failed to execute command.") return None + + def run_python_script(self, script: str) -> Optional[Dict[str, Any]]: + """ + Executes a python script on the server. + """ + payload = json.dumps({"code": script}) + + for _ in range(self.retry_times): + try: + response = requests.post(self.http_server + "/run_python", headers={'Content-Type': 'application/json'}, + data=payload, timeout=90) + if response.status_code == 200: + return response.json() + else: + return {"status": "error", "message": "Failed to execute command.", "output": None, "error": response.json()["error"]} + except requests.exceptions.ReadTimeout: + break + except Exception: + logger.error("An error occurred while trying to execute the command: %s", traceback.format_exc()) + logger.info("Retrying to execute command.") + time.sleep(self.retry_interval) + + logger.error("Failed to execute command.") + return {"status": "error", "message": "Failed to execute command.", "output": "", "error": "Retry limit reached."} + + def run_bash_script(self, script: str, timeout: int = 30, working_dir: Optional[str] = None) -> Optional[Dict[str, Any]]: + """ + Executes a bash script on the server. + + :param script: The bash script content (can be multi-line) + :param timeout: Execution timeout in seconds (default: 30) + :param working_dir: Working directory for script execution (optional) + :return: Dictionary with status, output, error, and returncode, or None if failed + """ + payload = json.dumps({ + "script": script, + "timeout": timeout, + "working_dir": working_dir + }) + + for _ in range(self.retry_times): + try: + response = requests.post( + self.http_server + "/run_bash_script", + headers={'Content-Type': 'application/json'}, + data=payload, + timeout=timeout + 100 # Add buffer to HTTP timeout + ) + if response.status_code == 200: + result = response.json() + logger.info("Bash script executed successfully with return code: %d", result.get("returncode", -1)) + return result + else: + logger.error("Failed to execute bash script. 
Status code: %d, response: %s", + response.status_code, response.text) + logger.info("Retrying to execute bash script.") + except requests.exceptions.ReadTimeout: + logger.error("Bash script execution timed out") + return { + "status": "error", + "output": "", + "error": f"Script execution timed out after {timeout} seconds", + "returncode": -1 + } + except Exception as e: + logger.error("An error occurred while trying to execute the bash script: %s", e) + logger.info("Retrying to execute bash script.") + time.sleep(self.retry_interval) + + logger.error("Failed to execute bash script after %d retries.", self.retry_times) + return { + "status": "error", + "output": "", + "error": f"Failed to execute bash script after {self.retry_times} retries", + "returncode": -1 + } def execute_action(self, action: Dict[str, Any]): """ diff --git a/desktop_env/server/main.py b/desktop_env/server/main.py index bc0d8c8..0fc4036 100644 --- a/desktop_env/server/main.py +++ b/desktop_env/server/main.py @@ -1568,5 +1568,230 @@ def end_recording(): return abort(500, description=f"Recording failed. The output file is missing or empty. ffmpeg stderr: {error_output}") +@app.route("/run_python", methods=['POST']) +def run_python(): + data = request.json + code = data.get('code', None) + + if not code: + return jsonify({'status': 'error', 'message': 'Code not supplied!'}), 400 + + # Create a temporary file to save the Python code + import tempfile + import uuid + + # Generate unique filename + temp_filename = f"/tmp/python_exec_{uuid.uuid4().hex}.py" + + try: + # Write code to temporary file + with open(temp_filename, 'w') as f: + f.write(code) + + # Execute the file using subprocess to capture all output + result = subprocess.run( + ['/usr/bin/python3', temp_filename], + stdout=subprocess.PIPE, + stderr=subprocess.PIPE, + text=True, + timeout=30 # 30 second timeout + ) + + # Clean up the temporary file + try: + os.remove(temp_filename) + except: + pass # Ignore cleanup errors + + # Prepare response + output = result.stdout + error_output = result.stderr + + # Combine output and errors if both exist + combined_message = output + if error_output: + combined_message += ('\n' + error_output) if output else error_output + + # Determine status based on return code and errors + if result.returncode != 0: + status = 'error' + if not error_output: + # If no stderr but non-zero return code, add a generic error message + error_output = f"Process exited with code {result.returncode}" + combined_message = combined_message + '\n' + error_output if combined_message else error_output + else: + status = 'success' + + return jsonify({ + 'status': status, + 'message': combined_message, + 'need_more': False, # Not applicable for file execution + 'output': output, # stdout only + 'error': error_output, # stderr only + 'return_code': result.returncode + }) + + except subprocess.TimeoutExpired: + # Clean up the temporary file on timeout + try: + os.remove(temp_filename) + except: + pass + + return jsonify({ + 'status': 'error', + 'message': 'Execution timeout: Code took too long to execute', + 'error': 'TimeoutExpired', + 'need_more': False, + 'output': None, + }), 500 + + except Exception as e: + # Clean up the temporary file on error + try: + os.remove(temp_filename) + except: + pass + + # Capture the exception details + return jsonify({ + 'status': 'error', + 'message': f'Execution error: {str(e)}', + 'error': traceback.format_exc(), + 'need_more': False, + 'output': None, + }), 500 + + +@app.route("/run_bash_script", methods=['POST']) 
+def run_bash_script():
+    data = request.json
+    script = data.get('script', None)
+    timeout = data.get('timeout', 100)  # Default timeout of 100 seconds when the client does not supply one
+    working_dir = data.get('working_dir', None)
+
+    if not script:
+        return jsonify({
+            'status': 'error',
+            'output': 'Script not supplied!',
+            'error': "",  # Always empty as requested
+            'returncode': -1
+        }), 400
+
+    # Expand user directory if provided
+    if working_dir:
+        working_dir = os.path.expanduser(working_dir)
+        if not os.path.exists(working_dir):
+            return jsonify({
+                'status': 'error',
+                'output': f'Working directory does not exist: {working_dir}',
+                'error': "",  # Always empty as requested
+                'returncode': -1
+            }), 400
+
+    # Create a temporary script file
+    import tempfile
+    with tempfile.NamedTemporaryFile(mode='w', suffix='.sh', delete=False) as tmp_file:
+        if "#!/bin/bash" not in script:
+            script = "#!/bin/bash\n\n" + script
+        tmp_file.write(script)
+        tmp_file_path = tmp_file.name
+
+    try:
+        # Make the script executable
+        os.chmod(tmp_file_path, 0o755)
+
+        # Execute the script
+        if platform_name == "Windows":
+            # On Windows, run via bash (Git Bash, WSL, etc.) if available; the sh fallback below handles a missing bash
+            flags = subprocess.CREATE_NO_WINDOW
+            # Try to use bash if available (Git Bash, WSL, etc.)
+            result = subprocess.run(
+                ['bash', tmp_file_path],
+                stdout=subprocess.PIPE,
+                stderr=subprocess.STDOUT,  # Merge stderr into stdout
+                text=True,
+                timeout=timeout,
+                cwd=working_dir,
+                creationflags=flags,
+                shell=False
+            )
+        else:
+            # On Unix-like systems, use bash directly
+            flags = 0
+            result = subprocess.run(
+                ['/bin/bash', tmp_file_path],
+                stdout=subprocess.PIPE,
+                stderr=subprocess.STDOUT,  # Merge stderr into stdout
+                text=True,
+                timeout=timeout,
+                cwd=working_dir,
+                creationflags=flags,
+                shell=False
+            )
+
+        # Log the command execution for trajectory recording
+        _append_event("BashScript",
+                      {"script": script, "output": result.stdout, "error": "", "returncode": result.returncode},
+                      ts=time.time())
+
+        return jsonify({
+            'status': 'success' if result.returncode == 0 else 'error',
+            'output': result.stdout,  # Contains both stdout and stderr merged
+            'error': "",  # Always empty as requested
+            'returncode': result.returncode
+        })
+
+    except subprocess.TimeoutExpired:
+        return jsonify({
+            'status': 'error',
+            'output': f'Script execution timed out after {timeout} seconds',
+            'error': "",  # Always empty as requested
+            'returncode': -1
+        }), 500
+    except FileNotFoundError:
+        # Bash not found, try with sh
+        try:
+            result = subprocess.run(
+                ['sh', tmp_file_path],
+                stdout=subprocess.PIPE,
+                stderr=subprocess.STDOUT,  # Merge stderr into stdout
+                text=True,
+                timeout=timeout,
+                cwd=working_dir,
+                shell=False
+            )
+
+            _append_event("BashScript",
+                          {"script": script, "output": result.stdout, "error": "", "returncode": result.returncode},
+                          ts=time.time())
+
+            return jsonify({
+                'status': 'success' if result.returncode == 0 else 'error',
+                'output': result.stdout,  # Contains both stdout and stderr merged
+                'error': "",  # Always empty as requested
+                'returncode': result.returncode,
+            })
+        except Exception as e:
+            return jsonify({
+                'status': 'error',
+                'output': f'Failed to execute script: {str(e)}',
+                'error': "",  # Always empty as requested
+                'returncode': -1
+            }), 500
+    except Exception as e:
+        return jsonify({
+            'status': 'error',
+            'output': f'Failed to execute script: {str(e)}',
+            'error': "",  # Always empty as requested
+            'returncode': -1
+        }), 500
+    finally:
+        # Clean up the temporary file
+        try:
+            os.unlink(tmp_file_path)
+        except:
+            pass
+
 if __name__ ==
'__main__': app.run(debug=True, host="0.0.0.0") diff --git a/mm_agents/coact/OAI_CONFIG_LIST b/mm_agents/coact/OAI_CONFIG_LIST new file mode 100644 index 0000000..7f96c0e --- /dev/null +++ b/mm_agents/coact/OAI_CONFIG_LIST @@ -0,0 +1,27 @@ +[ + { + "model": "gpt-4o", + "api_key": "KEY", + "tags": ["gpt-4o", "code", "explainer"] + }, + { + "model": "o3", + "api_key": "KEY", + "tags": ["o3", "coding", "explainer"] + }, + { + "model": "gpt-4.1", + "api_key": "KEY", + "tags": ["gpt-4.1", "coding", "explainer"] + }, + { + "model": "o4-mini", + "api_key": "KEY", + "tags": ["o4-mini", "coding", "explainer"] + }, + { + "model": "o3-mini", + "api_key": "KEY", + "tags": ["o3-mini", "coding", "explainer"] + } +] \ No newline at end of file diff --git a/mm_agents/coact/__init__.py b/mm_agents/coact/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/mm_agents/coact/autogen/__init__.py b/mm_agents/coact/autogen/__init__.py new file mode 100644 index 0000000..6681e5e --- /dev/null +++ b/mm_agents/coact/autogen/__init__.py @@ -0,0 +1,81 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +import logging + +from .agentchat import ( + Agent, + AssistantAgent, + ChatResult, + ConversableAgent, + GroupChat, + GroupChatManager, + UpdateSystemMessage, + UserProxyAgent, + gather_usage_summary, + initiate_chats, + register_function, +) +from .agentchat.group.context_expression import ContextExpression +from .code_utils import DEFAULT_MODEL, FAST_MODEL +from .exception_utils import ( + AgentNameConflictError, + InvalidCarryOverTypeError, + NoEligibleSpeakerError, + SenderRequiredError, + UndefinedNextAgentError, +) +from .llm_config import LLMConfig +from .oai import ( + Cache, + ModelClient, + OpenAIWrapper, + config_list_from_dotenv, + config_list_from_json, + config_list_from_models, + config_list_gpt4_gpt35, + config_list_openai_aoai, + filter_config, + get_config_list, +) + +# Set the root logger. +logger = logging.getLogger(__name__) +logger.setLevel(logging.INFO) + + +__all__ = [ + "DEFAULT_MODEL", + "FAST_MODEL", + "Agent", + "AgentNameConflictError", + "AssistantAgent", + "Cache", + "ChatResult", + "ContextExpression", + "ConversableAgent", + "GroupChat", + "GroupChatManager", + "InvalidCarryOverTypeError", + "LLMConfig", + "ModelClient", + "NoEligibleSpeakerError", + "OpenAIWrapper", + "SenderRequiredError", + "UndefinedNextAgentError", + "UpdateSystemMessage", + "UserProxyAgent", + "config_list_from_dotenv", + "config_list_from_json", + "config_list_from_models", + "config_list_gpt4_gpt35", + "config_list_openai_aoai", + "filter_config", + "gather_usage_summary", + "get_config_list", + "initiate_chats", + "register_function", +] diff --git a/mm_agents/coact/autogen/agentchat/__init__.py b/mm_agents/coact/autogen/agentchat/__init__.py new file mode 100644 index 0000000..dcc4508 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/__init__.py @@ -0,0 +1,38 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. 
+# SPDX-License-Identifier: MIT
+from .agent import Agent, LLMAgent
+from .assistant_agent import AssistantAgent
+from .chat import ChatResult, a_initiate_chats, initiate_chats
+
+from .conversable_agent import ConversableAgent, UpdateSystemMessage, register_function
+from .group.multi_agent_chat import a_initiate_group_chat, a_run_group_chat, initiate_group_chat, run_group_chat
+from .groupchat import GroupChat, GroupChatManager
+from .user_proxy_agent import UserProxyAgent
+from .utils import gather_usage_summary
+
+__all__ = [
+    "Agent",
+    "AssistantAgent",
+    "ChatResult",
+    "ConversableAgent",
+    "GroupChat",
+    "GroupChatManager",
+    "LLMAgent",
+    "UpdateSystemMessage",
+    "UserProxyAgent",
+    "a_initiate_chats",
+    "a_initiate_group_chat",
+    "a_run_group_chat",
+    "gather_usage_summary",
+    "initiate_chats",
+    "initiate_group_chat",
+    "register_function",
+    "run_group_chat",
+]
diff --git a/mm_agents/coact/autogen/agentchat/agent.py b/mm_agents/coact/autogen/agentchat/agent.py
new file mode 100644
index 0000000..6e034e3
--- /dev/null
+++ b/mm_agents/coact/autogen/agentchat/agent.py
@@ -0,0 +1,182 @@
+# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors
+#
+# SPDX-License-Identifier: Apache-2.0
+#
+# Portions derived from https://github.com/microsoft/autogen are under the MIT License.
+# SPDX-License-Identifier: MIT
+from typing import TYPE_CHECKING, Any, Optional, Protocol, TypeVar, Union, runtime_checkable
+
+from ..doc_utils import export_module
+
+__all__ = ["Agent", "LLMAgent", "LLMMessageType"]
+
+Tool = TypeVar("Tool")
+
+LLMMessageType = dict[str, Any]
+
+DEFAULT_SUMMARY_METHOD = "last_msg"
+
+
+@runtime_checkable
+@export_module("autogen")
+class Agent(Protocol):
+    """(In preview) A protocol for Agent.
+
+    An agent can communicate with other agents and perform actions.
+    Different agents can differ in what actions they perform in the `receive` method.
+    """
+
+    @property
+    def name(self) -> str:
+        """The name of the agent."""
+        ...
+
+    @property
+    def description(self) -> str:
+        """The description of the agent. Used for the agent's introduction in
+        a group chat setting.
+        """
+        ...
+
+    def send(
+        self,
+        message: Union[dict[str, Any], str],
+        recipient: "Agent",
+        request_reply: Optional[bool] = None,
+    ) -> None:
+        """Send a message to another agent.
+
+        Args:
+            message (dict or str): the message to send. If a dict, it should be
+                a JSON-serializable and follows the OpenAI's ChatCompletion schema.
+            recipient (Agent): the recipient of the message.
+            request_reply (bool): whether to request a reply from the recipient.
+        """
+        ...
+
+    async def a_send(
+        self,
+        message: Union[dict[str, Any], str],
+        recipient: "Agent",
+        request_reply: Optional[bool] = None,
+    ) -> None:
+        """(Async) Send a message to another agent.
+
+        Args:
+            message (dict or str): the message to send. If a dict, it should be
+                a JSON-serializable and follows the OpenAI's ChatCompletion schema.
+            recipient (Agent): the recipient of the message.
+            request_reply (bool): whether to request a reply from the recipient.
+        """
+        ...
+
+    def receive(
+        self,
+        message: Union[dict[str, Any], str],
+        sender: "Agent",
+        request_reply: Optional[bool] = None,
+    ) -> None:
+        """Receive a message from another agent.
+
+        Args:
+            message (dict or str): the message received. If a dict, it should be
+                a JSON-serializable and follows the OpenAI's ChatCompletion schema.
+            sender (Agent): the sender of the message.
+ request_reply (bool): whether the sender requests a reply. + """ + + async def a_receive( + self, + message: Union[dict[str, Any], str], + sender: "Agent", + request_reply: Optional[bool] = None, + ) -> None: + """(Async) Receive a message from another agent. + + Args: + message (dict or str): the message received. If a dict, it should be + a JSON-serializable and follows the OpenAI's ChatCompletion schema. + sender (Agent): the sender of the message. + request_reply (bool): whether the sender requests a reply. + """ + ... + + def generate_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional["Agent"] = None, + **kwargs: Any, + ) -> Union[str, dict[str, Any], None]: + """Generate a reply based on the received messages. + + Args: + messages (list[dict[str, Any]]): a list of messages received from other agents. + The messages are dictionaries that are JSON-serializable and + follows the OpenAI's ChatCompletion schema. + sender: sender of an Agent instance. + **kwargs: Additional keyword arguments. + + Returns: + str or dict or None: the generated reply. If None, no reply is generated. + """ + + async def a_generate_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional["Agent"] = None, + **kwargs: Any, + ) -> Union[str, dict[str, Any], None]: + """(Async) Generate a reply based on the received messages. + + Args: + messages (list[dict[str, Any]]): a list of messages received from other agents. + The messages are dictionaries that are JSON-serializable and + follows the OpenAI's ChatCompletion schema. + sender: sender of an Agent instance. + **kwargs: Additional keyword arguments. + + Returns: + str or dict or None: the generated reply. If None, no reply is generated. + """ + ... + + def set_ui_tools(self, tools: list[Tool]) -> None: + """Set the UI tools for the agent. + + Args: + tools: a list of UI tools to set. + """ + ... + + def unset_ui_tools(self, tools: list[Tool]) -> None: + """Unset the UI tools for the agent. + + Args: + tools: a list of UI tools to set. + """ + ... + + +@runtime_checkable +@export_module("autogen") +class LLMAgent(Agent, Protocol): + """(In preview) A protocol for an LLM agent.""" + + @property + def system_message(self) -> str: + """The system message of this agent.""" + + def update_system_message(self, system_message: str) -> None: + """Update this agent's system message. + + Args: + system_message (str): system message for inference. + """ + + +if TYPE_CHECKING: + # mypy will fail if Conversable agent does not implement Agent protocol + from .conversable_agent import ConversableAgent + + def _check_protocol_implementation(agent: ConversableAgent) -> Agent: + return agent diff --git a/mm_agents/coact/autogen/agentchat/assistant_agent.py b/mm_agents/coact/autogen/agentchat/assistant_agent.py new file mode 100644 index 0000000..60cefb2 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/assistant_agent.py @@ -0,0 +1,85 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. 
+# SPDX-License-Identifier: MIT +from typing import Any, Callable, Literal, Optional, Union + +from ..doc_utils import export_module +from ..llm_config import LLMConfig +from ..runtime_logging import log_new_agent, logging_enabled +from .conversable_agent import ConversableAgent + + +@export_module("autogen") +class AssistantAgent(ConversableAgent): + """(In preview) Assistant agent, designed to solve a task with LLM. + + AssistantAgent is a subclass of ConversableAgent configured with a default system message. + The default system message is designed to solve a task with LLM, + including suggesting python code blocks and debugging. + `human_input_mode` is default to "NEVER" + and `code_execution_config` is default to False. + This agent doesn't execute code by default, and expects the user to execute the code. + """ + + DEFAULT_SYSTEM_MESSAGE = """You are a helpful AI assistant. +Solve tasks using your coding and language skills. +In the following cases, suggest python code (in a python coding block) or shell script (in a sh coding block) for the user to execute. + 1. When you need to collect info, use the code to output the info you need, for example, browse or search the web, download/read a file, print the content of a webpage or a file, get the current date/time, check the operating system. After sufficient info is printed and the task is ready to be solved based on your language skill, you can solve the task by yourself. + 2. When you need to perform some task with code, use the code to perform the task and output the result. Finish the task smartly. +Solve the task step by step if you need to. If a plan is not provided, explain your plan first. Be clear which step uses code, and which step uses your language skill. +When using code, you must indicate the script type in the code block. The user cannot provide any other feedback or perform any other action beyond executing the code you suggest. The user can't modify your code. So do not suggest incomplete code which requires users to modify. Don't use a code block if it's not intended to be executed by the user. +If you want the user to save the code in a file before executing it, put # filename: inside the code block as the first line. Don't include multiple code blocks in one response. Do not ask users to copy and paste the result. Instead, use 'print' function for the output when relevant. Check the execution result returned by the user. +If the result indicates there is an error, fix the error and output the code again. Suggest the full code instead of partial code or code changes. If the error can't be fixed or if the task is not solved even after the code is executed successfully, analyze the problem, revisit your assumption, collect additional info you need, and think of a different approach to try. +When you find an answer, verify the answer carefully. Include verifiable evidence in your response if possible. +Reply "TERMINATE" in the end when everything is done. + """ + + DEFAULT_DESCRIPTION = "A helpful and general-purpose AI assistant that has strong language skills, Python skills, and Linux command line skills." 
+ + def __init__( + self, + name: str, + system_message: Optional[str] = DEFAULT_SYSTEM_MESSAGE, + llm_config: Optional[Union[LLMConfig, dict[str, Any], Literal[False]]] = None, + is_termination_msg: Optional[Callable[[dict[str, Any]], bool]] = None, + max_consecutive_auto_reply: Optional[int] = None, + human_input_mode: Literal["ALWAYS", "NEVER", "TERMINATE"] = "NEVER", + description: Optional[str] = None, + **kwargs: Any, + ): + """Args: + name (str): agent name. + system_message (str): system message for the ChatCompletion inference. + Please override this attribute if you want to reprogram the agent. + llm_config (dict or False or None): llm inference configuration. + Please refer to [OpenAIWrapper.create](https://docs.ag2.ai/latest/docs/api-reference/autogen/OpenAIWrapper/#autogen.OpenAIWrapper.create) + for available options. + is_termination_msg (function): a function that takes a message in the form of a dictionary + and returns a boolean value indicating if this received message is a termination message. + The dict can contain the following keys: "content", "role", "name", "function_call". + max_consecutive_auto_reply (int): the maximum number of consecutive auto replies. + default to None (no limit provided, class attribute MAX_CONSECUTIVE_AUTO_REPLY will be used as the limit in this case). + The limit only plays a role when human_input_mode is not "ALWAYS". + **kwargs (dict): Please refer to other kwargs in + [ConversableAgent](https://docs.ag2.ai/latest/docs/api-reference/autogen/ConversableAgent). + """ + super().__init__( + name, + system_message, + is_termination_msg, + max_consecutive_auto_reply, + human_input_mode, + llm_config=llm_config, + description=description, + **kwargs, + ) + if logging_enabled(): + log_new_agent(self, locals()) + + # Update the provided description if None, and we are using the default system_message, + # then use the default description. + if description is None and system_message == self.DEFAULT_SYSTEM_MESSAGE: + self.description = self.DEFAULT_DESCRIPTION diff --git a/mm_agents/coact/autogen/agentchat/chat.py b/mm_agents/coact/autogen/agentchat/chat.py new file mode 100644 index 0000000..0577d7b --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/chat.py @@ -0,0 +1,309 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +import asyncio +import datetime +import logging +import warnings +from collections import defaultdict +from dataclasses import dataclass +from functools import partial +from typing import Any + +from ..doc_utils import export_module +from ..events.agent_events import PostCarryoverProcessingEvent +from ..io.base import IOStream +from .utils import consolidate_chat_info + +logger = logging.getLogger(__name__) +Prerequisite = tuple[int, int] + +__all__ = ["ChatResult", "a_initiate_chats", "initiate_chats"] + + +@dataclass +@export_module("autogen") +class ChatResult: + """(Experimental) The result of a chat. Almost certain to be changed.""" + + chat_id: int = None + """chat id""" + chat_history: list[dict[str, Any]] = None + """The chat history.""" + summary: str = None + """A summary obtained from the chat.""" + cost: dict[str, dict[str, Any]] = ( + None # keys: "usage_including_cached_inference", "usage_excluding_cached_inference" + ) + """The cost of the chat. 
+ The value for each usage type is a dictionary containing cost information for that specific type. + - "usage_including_cached_inference": Cost information on the total usage, including the tokens in cached inference. + - "usage_excluding_cached_inference": Cost information on the usage of tokens, excluding the tokens in cache. No larger than "usage_including_cached_inference". + """ + human_input: list[str] = None + """A list of human input solicited during the chat.""" + + +def _validate_recipients(chat_queue: list[dict[str, Any]]) -> None: + """Validate recipients exits and warn repetitive recipients.""" + receipts_set = set() + for chat_info in chat_queue: + assert "recipient" in chat_info, "recipient must be provided." + receipts_set.add(chat_info["recipient"]) + if len(receipts_set) < len(chat_queue): + warnings.warn( + "Repetitive recipients detected: The chat history will be cleared by default if a recipient appears more than once. To retain the chat history, please set 'clear_history=False' in the configuration of the repeating agent.", + UserWarning, + ) + + +def __create_async_prerequisites(chat_queue: list[dict[str, Any]]) -> list[Prerequisite]: + """Create list of Prerequisite (prerequisite_chat_id, chat_id)""" + prerequisites = [] + for chat_info in chat_queue: + if "chat_id" not in chat_info: + raise ValueError("Each chat must have a unique id for async multi-chat execution.") + chat_id = chat_info["chat_id"] + pre_chats = chat_info.get("prerequisites", []) + for pre_chat_id in pre_chats: + if not isinstance(pre_chat_id, int): + raise ValueError("Prerequisite chat id is not int.") + prerequisites.append((chat_id, pre_chat_id)) + return prerequisites + + +def __find_async_chat_order(chat_ids: set[int], prerequisites: list[Prerequisite]) -> list[int]: + """Find chat order for async execution based on the prerequisite chats + + Args: + chat_ids: A set of all chat IDs that need to be scheduled + prerequisites: A list of tuples (chat_id, prerequisite_chat_id) where each tuple indicates that chat_id depends on prerequisite_chat_id + + Returns: + list: a list of chat_id in order. + """ + edges = defaultdict(set) + indegree = defaultdict(int) + for pair in prerequisites: + chat, pre = pair[0], pair[1] + if chat not in edges[pre]: + indegree[chat] += 1 + edges[pre].add(chat) + bfs = [i for i in chat_ids if i not in indegree] + chat_order = [] + steps = len(indegree) + for _ in range(steps + 1): + if not bfs: + break + chat_order.extend(bfs) + nxt = [] + for node in bfs: + if node in edges: + for course in edges[node]: + indegree[course] -= 1 + if indegree[course] == 0: + nxt.append(course) + indegree.pop(course) + edges.pop(node) + bfs = nxt + + if indegree: + return [] + return chat_order + + +def _post_process_carryover_item(carryover_item): + if isinstance(carryover_item, str): + return carryover_item + elif isinstance(carryover_item, dict) and "content" in carryover_item: + return str(carryover_item["content"]) + else: + return str(carryover_item) + + +def __post_carryover_processing(chat_info: dict[str, Any]) -> None: + iostream = IOStream.get_default() + + if "message" not in chat_info: + warnings.warn( + "message is not provided in a chat_queue entry. input() will be called to get the initial message.", + UserWarning, + ) + + iostream.send(PostCarryoverProcessingEvent(chat_info=chat_info)) + + +@export_module("autogen") +def initiate_chats(chat_queue: list[dict[str, Any]]) -> list[ChatResult]: + """Initiate a list of chats. 
+ + Args: + chat_queue (List[Dict]): A list of dictionaries containing the information about the chats. + + Each dictionary should contain the input arguments for + [`ConversableAgent.initiate_chat`](../ConversableAgent#initiate-chat). + For example: + - `"sender"` - the sender agent. + - `"recipient"` - the recipient agent. + - `"clear_history"` (bool) - whether to clear the chat history with the agent. + Default is True. + - `"silent"` (bool or None) - (Experimental) whether to print the messages in this + conversation. Default is False. + - `"cache"` (Cache or None) - the cache client to use for this conversation. + Default is None. + - `"max_turns"` (int or None) - maximum number of turns for the chat. If None, the chat + will continue until a termination condition is met. Default is None. + - `"summary_method"` (str or callable) - a string or callable specifying the method to get + a summary from the chat. Default is DEFAULT_summary_method, i.e., "last_msg". + - `"summary_args"` (dict) - a dictionary of arguments to be passed to the summary_method. + Default is {}. + - `"message"` (str, callable or None) - if None, input() will be called to get the + initial message. + - `**context` - additional context information to be passed to the chat. + - `"carryover"` - It can be used to specify the carryover information to be passed + to this chat. If provided, we will combine this carryover with the "message" content when + generating the initial chat message in `generate_init_message`. + - `"finished_chat_indexes_to_exclude_from_carryover"` - It can be used by specifying a list of indexes of the finished_chats list, + from which to exclude the summaries for carryover. If 'finished_chat_indexes_to_exclude_from_carryover' is not provided or an empty list, + then summary from all the finished chats will be taken. + + Returns: + (list): a list of ChatResult objects corresponding to the finished chats in the chat_queue. + """ + consolidate_chat_info(chat_queue) + _validate_recipients(chat_queue) + current_chat_queue = chat_queue.copy() + finished_chats = [] + while current_chat_queue: + chat_info = current_chat_queue.pop(0) + _chat_carryover = chat_info.get("carryover", []) + finished_chat_indexes_to_exclude_from_carryover = chat_info.get( + "finished_chat_indexes_to_exclude_from_carryover", [] + ) + + if isinstance(_chat_carryover, str): + _chat_carryover = [_chat_carryover] + chat_info["carryover"] = _chat_carryover + [ + r.summary for i, r in enumerate(finished_chats) if i not in finished_chat_indexes_to_exclude_from_carryover + ] + + if not chat_info.get("silent", False): + __post_carryover_processing(chat_info) + + sender = chat_info["sender"] + chat_res = sender.initiate_chat(**chat_info) + finished_chats.append(chat_res) + return finished_chats + + +def __system_now_str(): + ct = datetime.datetime.now() + return f" System time at {ct}. " + + +def _on_chat_future_done(chat_future: asyncio.Future, chat_id: int): + """Update ChatResult when async Task for Chat is completed.""" + logger.debug(f"Update chat {chat_id} result on task completion." + __system_now_str()) + chat_result = chat_future.result() + chat_result.chat_id = chat_id + + +async def _dependent_chat_future( + chat_id: int, chat_info: dict[str, Any], prerequisite_chat_futures: dict[int, asyncio.Future] +) -> asyncio.Task: + """Create an async Task for each chat.""" + logger.debug(f"Create Task for chat {chat_id}." 
+ __system_now_str()) + _chat_carryover = chat_info.get("carryover", []) + finished_chat_indexes_to_exclude_from_carryover = chat_info.get( + "finished_chat_indexes_to_exclude_from_carryover", [] + ) + finished_chats = dict() + for chat in prerequisite_chat_futures: + chat_future = prerequisite_chat_futures[chat] + if chat_future.cancelled(): + raise RuntimeError(f"Chat {chat} is cancelled.") + + # wait for prerequisite chat results for the new chat carryover + finished_chats[chat] = await chat_future + + if isinstance(_chat_carryover, str): + _chat_carryover = [_chat_carryover] + data = [ + chat_result.summary + for chat_id, chat_result in finished_chats.items() + if chat_id not in finished_chat_indexes_to_exclude_from_carryover + ] + chat_info["carryover"] = _chat_carryover + data + if not chat_info.get("silent", False): + __post_carryover_processing(chat_info) + + sender = chat_info["sender"] + chat_res_future = asyncio.create_task(sender.a_initiate_chat(**chat_info)) + call_back_with_args = partial(_on_chat_future_done, chat_id=chat_id) + chat_res_future.add_done_callback(call_back_with_args) + logger.debug(f"Task for chat {chat_id} created." + __system_now_str()) + return chat_res_future + + +async def a_initiate_chats(chat_queue: list[dict[str, Any]]) -> dict[int, ChatResult]: + """(async) Initiate a list of chats. + + Args: + chat_queue (List[Dict]): A list of dictionaries containing the information about the chats. + + Each dictionary should contain the input arguments for + [`ConversableAgent.initiate_chat`](../../../ConversableAgent#initiate-chat). + For example: + - `"sender"` - the sender agent. + - `"recipient"` - the recipient agent. + - `"clear_history"` (bool) - whether to clear the chat history with the agent. + Default is True. + - `"silent"` (bool or None) - (Experimental) whether to print the messages in this + conversation. Default is False. + - `"cache"` (Cache or None) - the cache client to use for this conversation. + Default is None. + - `"max_turns"` (int or None) - maximum number of turns for the chat. If None, the chat + will continue until a termination condition is met. Default is None. + - `"summary_method"` (str or callable) - a string or callable specifying the method to get + a summary from the chat. Default is DEFAULT_summary_method, i.e., "last_msg". + - `"summary_args"` (dict) - a dictionary of arguments to be passed to the summary_method. + Default is {}. + - `"message"` (str, callable or None) - if None, input() will be called to get the + initial message. + - `**context` - additional context information to be passed to the chat. + - `"carryover"` - It can be used to specify the carryover information to be passed + to this chat. If provided, we will combine this carryover with the "message" content when + generating the initial chat message in `generate_init_message`. + - `"finished_chat_indexes_to_exclude_from_carryover"` - It can be used by specifying a list of indexes of the finished_chats list, + from which to exclude the summaries for carryover. If 'finished_chat_indexes_to_exclude_from_carryover' is not provided or an empty list, + then summary from all the finished chats will be taken. + + + Returns: + - (Dict): a dict of ChatId: ChatResult corresponding to the finished chats in the chat_queue. 
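+
+    Example (illustrative only; `manager`, `writer`, and `reviewer` are hypothetical agents):
+
+        ```python
+        results = await a_initiate_chats([
+            {"chat_id": 1, "sender": manager, "recipient": writer, "message": "Draft a short summary.", "max_turns": 2},
+            {"chat_id": 2, "sender": manager, "recipient": reviewer, "message": "Review the draft.", "prerequisites": [1], "max_turns": 2},
+        ])
+        print(results[2].summary)  # chat 2 runs after chat 1 and receives its summary as carryover
+        ```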
+ """ + consolidate_chat_info(chat_queue) + _validate_recipients(chat_queue) + chat_book = {chat_info["chat_id"]: chat_info for chat_info in chat_queue} + num_chats = chat_book.keys() + prerequisites = __create_async_prerequisites(chat_queue) + chat_order_by_id = __find_async_chat_order(num_chats, prerequisites) + finished_chat_futures = dict() + for chat_id in chat_order_by_id: + chat_info = chat_book[chat_id] + prerequisite_chat_ids = chat_info.get("prerequisites", []) + pre_chat_futures = dict() + for pre_chat_id in prerequisite_chat_ids: + pre_chat_future = finished_chat_futures[pre_chat_id] + pre_chat_futures[pre_chat_id] = pre_chat_future + current_chat_future = await _dependent_chat_future(chat_id, chat_info, pre_chat_futures) + finished_chat_futures[chat_id] = current_chat_future + await asyncio.gather(*list(finished_chat_futures.values())) + finished_chats = dict() + for chat in finished_chat_futures: + chat_result = finished_chat_futures[chat].result() + finished_chats[chat] = chat_result + return finished_chats diff --git a/mm_agents/coact/autogen/agentchat/contrib/__init__.py b/mm_agents/coact/autogen/agentchat/contrib/__init__.py new file mode 100644 index 0000000..a80fb86 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/contrib/__init__.py @@ -0,0 +1,5 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +__all__: list[str] = [] diff --git a/mm_agents/coact/autogen/agentchat/contrib/capabilities/__init__.py b/mm_agents/coact/autogen/agentchat/contrib/capabilities/__init__.py new file mode 100644 index 0000000..a80fb86 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/contrib/capabilities/__init__.py @@ -0,0 +1,5 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +__all__: list[str] = [] diff --git a/mm_agents/coact/autogen/agentchat/contrib/capabilities/agent_capability.py b/mm_agents/coact/autogen/agentchat/contrib/capabilities/agent_capability.py new file mode 100644 index 0000000..ee7bdf7 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/contrib/capabilities/agent_capability.py @@ -0,0 +1,20 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +from ...assistant_agent import ConversableAgent + + +class AgentCapability: + """Base class for composable capabilities that can be added to an agent.""" + + def __init__(self): + pass + + def add_to_agent(self, agent: ConversableAgent): + """Adds a particular capability to the given agent. Must be implemented by the capability subclass. + An implementation will typically call agent.register_hook() one or more times. See teachability.py as an example. 
+ """ + raise NotImplementedError diff --git a/mm_agents/coact/autogen/agentchat/contrib/capabilities/generate_images.py b/mm_agents/coact/autogen/agentchat/contrib/capabilities/generate_images.py new file mode 100644 index 0000000..d98eb58 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/contrib/capabilities/generate_images.py @@ -0,0 +1,301 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +import re +from typing import Any, Literal, Optional, Protocol, Union + +from .... import Agent, ConversableAgent, code_utils +from ....cache import AbstractCache +from ....import_utils import optional_import_block, require_optional_import +from ....llm_config import LLMConfig +from .. import img_utils +from ..capabilities.agent_capability import AgentCapability +from ..text_analyzer_agent import TextAnalyzerAgent + +with optional_import_block(): + from PIL.Image import Image + from openai import OpenAI + +SYSTEM_MESSAGE = "You've been given the special ability to generate images." +DESCRIPTION_MESSAGE = "This agent has the ability to generate images." + +PROMPT_INSTRUCTIONS = """In detail, please summarize the provided prompt to generate the image described in the TEXT. +DO NOT include any advice. RESPOND like the following example: +EXAMPLE: Blue background, 3D shapes, ... +""" + + +class ImageGenerator(Protocol): + """This class defines an interface for image generators. + + Concrete implementations of this protocol must provide a `generate_image` method that takes a string prompt as + input and returns a PIL Image object. + + NOTE: Current implementation does not allow you to edit a previously existing image. + """ + + def generate_image(self, prompt: str) -> "Image": + """Generates an image based on the provided prompt. + + Args: + prompt: A string describing the desired image. + + Returns: + A PIL Image object representing the generated image. + + Raises: + ValueError: If the image generation fails. + """ + ... + + def cache_key(self, prompt: str) -> str: + """Generates a unique cache key for the given prompt. + + This key can be used to store and retrieve generated images based on the prompt. + + Args: + prompt: A string describing the desired image. + + Returns: + A unique string that can be used as a cache key. + """ + ... + + +@require_optional_import("PIL", "unknown") +@require_optional_import("openai>=1.66.2", "openai") +class DalleImageGenerator: + """Generates images using OpenAI's DALL-E models. + + This class provides a convenient interface for generating images based on textual prompts using OpenAI's DALL-E + models. It allows you to specify the DALL-E model, resolution, quality, and the number of images to generate. + + Note: Current implementation does not allow you to edit a previously existing image. + """ + + def __init__( + self, + llm_config: Union[LLMConfig, dict[str, Any]], + resolution: Literal["256x256", "512x512", "1024x1024", "1792x1024", "1024x1792"] = "1024x1024", + quality: Literal["standard", "hd"] = "standard", + num_images: int = 1, + ): + """Args: + llm_config (LLMConfig or dict): llm config, must contain a valid dalle model and OpenAI API key in config_list. + resolution (str): The resolution of the image you want to generate. Must be one of "256x256", "512x512", "1024x1024", "1792x1024", "1024x1792". 
+ quality (str): The quality of the image you want to generate. Must be one of "standard", "hd". + num_images (int): The number of images to generate. + """ + config_list = llm_config["config_list"] + _validate_dalle_model(config_list[0]["model"]) + _validate_resolution_format(resolution) + + self._model = config_list[0]["model"] + self._resolution = resolution + self._quality = quality + self._num_images = num_images + self._dalle_client = OpenAI(api_key=config_list[0]["api_key"]) + + def generate_image(self, prompt: str) -> "Image": + response = self._dalle_client.images.generate( + model=self._model, + prompt=prompt, + size=self._resolution, + quality=self._quality, + n=self._num_images, + ) + + image_url = response.data[0].url + if image_url is None: + raise ValueError("Failed to generate image.") + + return img_utils.get_pil_image(image_url) + + def cache_key(self, prompt: str) -> str: + keys = (prompt, self._model, self._resolution, self._quality, self._num_images) + return ",".join([str(k) for k in keys]) + + +@require_optional_import("PIL", "unknown") +class ImageGeneration(AgentCapability): + """This capability allows a ConversableAgent to generate images based on the message received from other Agents. + + 1. Utilizes a TextAnalyzerAgent to analyze incoming messages to identify requests for image generation and + extract relevant details. + 2. Leverages the provided ImageGenerator (e.g., DalleImageGenerator) to create the image. + 3. Optionally caches generated images for faster retrieval in future conversations. + + NOTE: This capability increases the token usage of the agent, as it uses TextAnalyzerAgent to analyze every + message received by the agent. + + Example: + ```python + import autogen + from autogen.agentchat.contrib.capabilities.image_generation import ImageGeneration + + # Assuming you have llm configs configured for the LLMs you want to use and Dalle. + # Create the agent + agent = autogen.ConversableAgent( + name="dalle", llm_config={...}, max_consecutive_auto_reply=3, human_input_mode="NEVER" + ) + + # Create an ImageGenerator with desired settings + dalle_gen = generate_images.DalleImageGenerator(llm_config={...}) + + # Add the ImageGeneration capability to the agent + agent.add_capability(ImageGeneration(image_generator=dalle_gen)) + ``` + """ + + def __init__( + self, + image_generator: ImageGenerator, + cache: Optional[AbstractCache] = None, + text_analyzer_llm_config: Optional[Union[LLMConfig, dict[str, Any]]] = None, + text_analyzer_instructions: str = PROMPT_INSTRUCTIONS, + verbosity: int = 0, + register_reply_position: int = 2, + ): + """Args: + image_generator (ImageGenerator): The image generator you would like to use to generate images. + cache (None or AbstractCache): The cache client to use to store and retrieve generated images. If None, + no caching will be used. + text_analyzer_llm_config (LLMConfig or Dict or None): The LLM config for the text analyzer. If None, the LLM config will + be retrieved from the agent you're adding the ability to. + text_analyzer_instructions (str): Instructions provided to the TextAnalyzerAgent used to analyze + incoming messages and extract the prompt for image generation. The default instructions focus on + summarizing the prompt. You can customize the instructions to achieve more granular control over prompt + extraction. + Example: 'Extract specific details from the message, like desired objects, styles, or backgrounds.' + verbosity (int): The verbosity level. Defaults to 0 and must be greater than or equal to 0. 
The text + analyzer llm calls will be silent if verbosity is less than 2. + register_reply_position (int): The position of the reply function in the agent's list of reply functions. + This capability registers a new reply function to handle messages with image generation requests. + Defaults to 2 to place it after the check termination and human reply for a ConversableAgent. + """ + self._image_generator = image_generator + self._cache = cache + self._text_analyzer_llm_config = text_analyzer_llm_config + self._text_analyzer_instructions = text_analyzer_instructions + self._verbosity = verbosity + self._register_reply_position = register_reply_position + + self._agent: Optional[ConversableAgent] = None + self._text_analyzer: Optional[TextAnalyzerAgent] = None + + def add_to_agent(self, agent: ConversableAgent): + """Adds the Image Generation capability to the specified ConversableAgent. + + This function performs the following modifications to the agent: + + 1. Registers a reply function: A new reply function is registered with the agent to handle messages that + potentially request image generation. This function analyzes the message and triggers image generation if + necessary. + 2. Creates an Agent (TextAnalyzerAgent): This is used to analyze messages for image generation requirements. + 3. Updates System Message: The agent's system message is updated to include a message indicating the + capability to generate images has been added. + 4. Updates Description: The agent's description is updated to reflect the addition of the Image Generation + capability. This might be helpful in certain use cases, like group chats. + + Args: + agent (ConversableAgent): The ConversableAgent to add the capability to. + """ + self._agent = agent + + agent.register_reply([Agent, None], self._image_gen_reply, position=self._register_reply_position) + + self._text_analyzer_llm_config = self._text_analyzer_llm_config or agent.llm_config + self._text_analyzer = TextAnalyzerAgent(llm_config=self._text_analyzer_llm_config) + + agent.update_system_message(agent.system_message + "\n" + SYSTEM_MESSAGE) + agent.description += "\n" + DESCRIPTION_MESSAGE + + def _image_gen_reply( + self, + recipient: ConversableAgent, + messages: Optional[list[dict[str, Any]]], + sender: Optional[Agent] = None, + config: Optional[Any] = None, + ) -> tuple[bool, Optional[Union[str, dict[str, Any]]]]: + if messages is None: + return False, None + + last_message = code_utils.content_str(messages[-1]["content"]) + + if not last_message: + return False, None + + if self._should_generate_image(last_message): + prompt = self._extract_prompt(last_message) + + image = self._cache_get(prompt) + if image is None: + image = self._image_generator.generate_image(prompt) + self._cache_set(prompt, image) + + return True, self._generate_content_message(prompt, image) + + else: + return False, None + + def _should_generate_image(self, message: str) -> bool: + assert self._text_analyzer is not None + + instructions = """ + Does any part of the TEXT ask the agent to generate an image? + The TEXT must explicitly mention that the image must be generated. + Answer with just one word, yes or no. 
+ """ + analysis = self._text_analyzer.analyze_text(message, instructions) + + return "yes" in self._extract_analysis(analysis).lower() + + def _extract_prompt(self, last_message) -> str: + assert self._text_analyzer is not None + + analysis = self._text_analyzer.analyze_text(last_message, self._text_analyzer_instructions) + return self._extract_analysis(analysis) + + def _cache_get(self, prompt: str) -> Optional["Image"]: + if self._cache: + key = self._image_generator.cache_key(prompt) + cached_value = self._cache.get(key) + + if cached_value: + return img_utils.get_pil_image(cached_value) + + def _cache_set(self, prompt: str, image: "Image"): + if self._cache: + key = self._image_generator.cache_key(prompt) + self._cache.set(key, img_utils.pil_to_data_uri(image)) + + def _extract_analysis(self, analysis: Optional[Union[str, dict[str, Any]]]) -> str: + if isinstance(analysis, dict): + return code_utils.content_str(analysis["content"]) + else: + return code_utils.content_str(analysis) + + def _generate_content_message(self, prompt: str, image: "Image") -> dict[str, Any]: + return { + "content": [ + {"type": "text", "text": f"I generated an image with the prompt: {prompt}"}, + {"type": "image_url", "image_url": {"url": img_utils.pil_to_data_uri(image)}}, + ] + } + + +# Helpers +def _validate_resolution_format(resolution: str): + """Checks if a string is in a valid resolution format (e.g., "1024x768").""" + pattern = r"^\d+x\d+$" # Matches a pattern of digits, "x", and digits + matched_resolution = re.match(pattern, resolution) + if matched_resolution is None: + raise ValueError(f"Invalid resolution format: {resolution}") + + +def _validate_dalle_model(model: str): + if model not in ["dall-e-3", "dall-e-2"]: + raise ValueError(f"Invalid DALL-E model: {model}. Must be 'dall-e-3' or 'dall-e-2'") diff --git a/mm_agents/coact/autogen/agentchat/contrib/capabilities/teachability.py b/mm_agents/coact/autogen/agentchat/contrib/capabilities/teachability.py new file mode 100644 index 0000000..b6e6634 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/contrib/capabilities/teachability.py @@ -0,0 +1,393 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +import os +import pickle +from typing import Any, Optional, Union + +from ....formatting_utils import colored +from ....import_utils import optional_import_block, require_optional_import +from ....llm_config import LLMConfig +from ...assistant_agent import ConversableAgent +from ..text_analyzer_agent import TextAnalyzerAgent +from .agent_capability import AgentCapability + +with optional_import_block(): + import chromadb + from chromadb.config import Settings + + +class Teachability(AgentCapability): + """Teachability uses a vector database to give an agent the ability to remember user teachings, + where the user is any caller (human or not) sending messages to the teachable agent. + Teachability is designed to be composable with other agent capabilities. + To make any conversable agent teachable, instantiate both the agent and the Teachability class, + then pass the agent to teachability.add_to_agent(agent). + Note that teachable agents in a group chat must be given unique path_to_db_dir values. 
+ + When adding Teachability to an agent, the following are modified: + - The agent's system message is appended with a note about the agent's new ability. + - A hook is added to the agent's `process_last_received_message` hookable method, + and the hook potentially modifies the last of the received messages to include earlier teachings related to the message. + Added teachings do not propagate into the stored message history. + If new user teachings are detected, they are added to new memos in the vector database. + """ + + def __init__( + self, + verbosity: Optional[int] = 0, + reset_db: Optional[bool] = False, + path_to_db_dir: Optional[str] = "./tmp/teachable_agent_db", + recall_threshold: Optional[float] = 1.5, + max_num_retrievals: Optional[int] = 10, + llm_config: Optional[Union[LLMConfig, dict[str, Any], bool]] = None, + ): + """Args: + verbosity (Optional, int): # 0 (default) for basic info, 1 to add memory operations, 2 for analyzer messages, 3 for memo lists. + reset_db (Optional, bool): True to clear the DB before starting. Default False. + path_to_db_dir (Optional, str): path to the directory where this particular agent's DB is stored. Default "./tmp/teachable_agent_db" + recall_threshold (Optional, float): The maximum distance for retrieved memos, where 0.0 is exact match. Default 1.5. Larger values allow more (but less relevant) memos to be recalled. + max_num_retrievals (Optional, int): The maximum number of memos to retrieve from the DB. Default 10. + llm_config (LLMConfig or dict or False): llm inference configuration passed to TextAnalyzerAgent. + If None, TextAnalyzerAgent uses llm_config from the teachable agent. + """ + self.verbosity = verbosity + self.path_to_db_dir = path_to_db_dir + self.recall_threshold = recall_threshold + self.max_num_retrievals = max_num_retrievals + self.llm_config = llm_config + + self.analyzer = None + self.teachable_agent = None + + # Create the memo store. + self.memo_store = MemoStore(self.verbosity, reset_db, self.path_to_db_dir) + + def add_to_agent(self, agent: ConversableAgent): + """Adds teachability to the given agent.""" + self.teachable_agent = agent + + # Register a hook for processing the last message. + agent.register_hook(hookable_method="process_last_received_message", hook=self.process_last_received_message) + + # Was an llm_config passed to the constructor? + if self.llm_config is None: + # No. Use the agent's llm_config. + self.llm_config = agent.llm_config + assert self.llm_config, "Teachability requires a valid llm_config." + + # Create the analyzer agent. + self.analyzer = TextAnalyzerAgent(llm_config=self.llm_config) + + # Append extra info to the system message. + agent.update_system_message( + agent.system_message + + "\nYou've been given the special ability to remember user teachings from prior conversations." + ) + + def prepopulate_db(self): + """Adds a few arbitrary memos to the DB.""" + self.memo_store.prepopulate() + + def process_last_received_message(self, text: Union[dict[str, Any], str]): + """Appends any relevant memos to the message text, and stores any apparent teachings in new memos. + Uses TextAnalyzerAgent to make decisions about memo storage and retrieval. + """ + # Try to retrieve relevant memos from the DB. + expanded_text = text + if self.memo_store.last_memo_id > 0: + expanded_text = self._consider_memo_retrieval(text) + + # Try to store any user teachings in new memos to be used in the future. + self._consider_memo_storage(text) + + # Return the (possibly) expanded message text. 
+ return expanded_text + + def _consider_memo_storage(self, comment: Union[dict[str, Any], str]): + """Decides whether to store something from one user comment in the DB.""" + memo_added = False + + # Check for a problem-solution pair. + response = self._analyze( + comment, + "Does any part of the TEXT ask the agent to perform a task or solve a problem? Answer with just one word, yes or no.", + ) + if "yes" in response.lower(): + # Can we extract advice? + advice = self._analyze( + comment, + "Briefly copy any advice from the TEXT that may be useful for a similar but different task in the future. But if no advice is present, just respond with 'none'.", + ) + if "none" not in advice.lower(): + # Yes. Extract the task. + task = self._analyze( + comment, + "Briefly copy just the task from the TEXT, then stop. Don't solve it, and don't include any advice.", + ) + # Generalize the task. + general_task = self._analyze( + task, + "Summarize very briefly, in general terms, the type of task described in the TEXT. Leave out details that might not appear in a similar problem.", + ) + # Add the task-advice (problem-solution) pair to the vector DB. + if self.verbosity >= 1: + print(colored("\nREMEMBER THIS TASK-ADVICE PAIR", "light_yellow")) + self.memo_store.add_input_output_pair(general_task, advice) + memo_added = True + + # Check for information to be learned. + response = self._analyze( + comment, + "Does the TEXT contain information that could be committed to memory? Answer with just one word, yes or no.", + ) + if "yes" in response.lower(): + # Yes. What question would this information answer? + question = self._analyze( + comment, + "Imagine that the user forgot this information in the TEXT. How would they ask you for this information? Include no other text in your response.", + ) + # Extract the information. + answer = self._analyze( + comment, "Copy the information from the TEXT that should be committed to memory. Add no explanation." + ) + # Add the question-answer pair to the vector DB. + if self.verbosity >= 1: + print(colored("\nREMEMBER THIS QUESTION-ANSWER PAIR", "light_yellow")) + self.memo_store.add_input_output_pair(question, answer) + memo_added = True + + # Were any memos added? + if memo_added: + # Yes. Save them to disk. + self.memo_store._save_memos() + + def _consider_memo_retrieval(self, comment: Union[dict[str, Any], str]): + """Decides whether to retrieve memos from the DB, and add them to the chat context.""" + # First, use the comment directly as the lookup key. + if self.verbosity >= 1: + print(colored("\nLOOK FOR RELEVANT MEMOS, AS QUESTION-ANSWER PAIRS", "light_yellow")) + memo_list = self._retrieve_relevant_memos(comment) + + # Next, if the comment involves a task, then extract and generalize the task before using it as the lookup key. + response = self._analyze( + comment, + "Does any part of the TEXT ask the agent to perform a task or solve a problem? Answer with just one word, yes or no.", + ) + if "yes" in response.lower(): + if self.verbosity >= 1: + print(colored("\nLOOK FOR RELEVANT MEMOS, AS TASK-ADVICE PAIRS", "light_yellow")) + # Extract the task. + task = self._analyze( + comment, "Copy just the task from the TEXT, then stop. Don't solve it, and don't include any advice." + ) + # Generalize the task. + general_task = self._analyze( + task, + "Summarize very briefly, in general terms, the type of task described in the TEXT. Leave out details that might not appear in a similar problem.", + ) + # Append any relevant memos. 
+ memo_list.extend(self._retrieve_relevant_memos(general_task)) + + # De-duplicate the memo list. + memo_list = list(set(memo_list)) + + # Append the memos to the text of the last message. + return comment + self._concatenate_memo_texts(memo_list) + + def _retrieve_relevant_memos(self, input_text: str) -> list: + """Returns semantically related memos from the DB.""" + memo_list = self.memo_store.get_related_memos( + input_text, n_results=self.max_num_retrievals, threshold=self.recall_threshold + ) + + if self.verbosity >= 1: # noqa: SIM102 + # Was anything retrieved? + if len(memo_list) == 0: + # No. Look at the closest memo. + print(colored("\nTHE CLOSEST MEMO IS BEYOND THE THRESHOLD:", "light_yellow")) + self.memo_store.get_nearest_memo(input_text) + print() # Print a blank line. The memo details were printed by get_nearest_memo(). + + # Create a list of just the memo output_text strings. + memo_list = [memo[1] for memo in memo_list] + return memo_list + + def _concatenate_memo_texts(self, memo_list: list) -> str: + """Concatenates the memo texts into a single string for inclusion in the chat context.""" + memo_texts = "" + if len(memo_list) > 0: + info = "\n# Memories that might help\n" + for memo in memo_list: + info = info + "- " + memo + "\n" + if self.verbosity >= 1: + print(colored("\nMEMOS APPENDED TO LAST MESSAGE...\n" + info + "\n", "light_yellow")) + memo_texts = memo_texts + "\n" + info + return memo_texts + + def _analyze(self, text_to_analyze: Union[dict[str, Any], str], analysis_instructions: Union[dict[str, Any], str]): + """Asks TextAnalyzerAgent to analyze the given text according to specific instructions.""" + self.analyzer.reset() # Clear the analyzer's list of messages. + self.teachable_agent.send( + recipient=self.analyzer, message=text_to_analyze, request_reply=False, silent=(self.verbosity < 2) + ) # Put the message in the analyzer's list. + self.teachable_agent.send( + recipient=self.analyzer, message=analysis_instructions, request_reply=True, silent=(self.verbosity < 2) + ) # Request the reply. + return self.teachable_agent.last_message(self.analyzer)["content"] + + +@require_optional_import("chromadb", "teachable") +class MemoStore: + """Provides memory storage and retrieval for a teachable agent, using a vector database. + Each DB entry (called a memo) is a pair of strings: an input text and an output text. + The input text might be a question, or a task to perform. + The output text might be an answer to the question, or advice on how to perform the task. + Vector embeddings are currently supplied by Chroma's default Sentence Transformers. + """ + + def __init__( + self, + verbosity: Optional[int] = 0, + reset: Optional[bool] = False, + path_to_db_dir: Optional[str] = "./tmp/teachable_agent_db", + ): + """Args: + - verbosity (Optional, int): 1 to print memory operations, 0 to omit them. 3+ to print memo lists. + - reset (Optional, bool): True to clear the DB before starting. Default False. + - path_to_db_dir (Optional, str): path to the directory where the DB is stored. + """ + self.verbosity = verbosity + self.path_to_db_dir = path_to_db_dir + + # Load or create the vector DB on disk. + settings = Settings( + anonymized_telemetry=False, allow_reset=True, is_persistent=True, persist_directory=path_to_db_dir + ) + self.db_client = chromadb.Client(settings) + self.vec_db = self.db_client.create_collection("memos", get_or_create=True) # The collection is the DB. + + # Load or create the associated memo dict on disk. 
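+        # uid_text_dict maps each memo id (a stringified integer) to its (input_text, output_text) pair,
+        # mirroring the documents stored in the vector DB collection.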
+ self.path_to_dict = os.path.join(path_to_db_dir, "uid_text_dict.pkl") + self.uid_text_dict = {} + self.last_memo_id = 0 + if (not reset) and os.path.exists(self.path_to_dict): + print(colored("\nLOADING MEMORY FROM DISK", "light_green")) + print(colored(f" Location = {self.path_to_dict}", "light_green")) + with open(self.path_to_dict, "rb") as f: + self.uid_text_dict = pickle.load(f) + self.last_memo_id = len(self.uid_text_dict) + if self.verbosity >= 3: + self.list_memos() + + # Clear the DB if requested. + if reset: + self.reset_db() + + def list_memos(self): + """Prints the contents of MemoStore.""" + print(colored("LIST OF MEMOS", "light_green")) + for uid, text in self.uid_text_dict.items(): + input_text, output_text = text + print( + colored( + f" ID: {uid}\n INPUT TEXT: {input_text}\n OUTPUT TEXT: {output_text}", + "light_green", + ) + ) + + def _save_memos(self): + """Saves self.uid_text_dict to disk.""" + with open(self.path_to_dict, "wb") as file: + pickle.dump(self.uid_text_dict, file) + + def reset_db(self): + """Forces immediate deletion of the DB's contents, in memory and on disk.""" + print(colored("\nCLEARING MEMORY", "light_green")) + self.db_client.delete_collection("memos") + self.vec_db = self.db_client.create_collection("memos") + self.uid_text_dict = {} + self._save_memos() + + def add_input_output_pair(self, input_text: str, output_text: str): + """Adds an input-output pair to the vector DB.""" + self.last_memo_id += 1 + self.vec_db.add(documents=[input_text], ids=[str(self.last_memo_id)]) + self.uid_text_dict[str(self.last_memo_id)] = input_text, output_text + if self.verbosity >= 1: + print( + colored( + f"\nINPUT-OUTPUT PAIR ADDED TO VECTOR DATABASE:\n ID\n {self.last_memo_id}\n INPUT\n {input_text}\n OUTPUT\n {output_text}\n", + "light_yellow", + ) + ) + if self.verbosity >= 3: + self.list_memos() + + def get_nearest_memo(self, query_text: str): + """Retrieves the nearest memo to the given query text.""" + results = self.vec_db.query(query_texts=[query_text], n_results=1) + uid, input_text, distance = results["ids"][0][0], results["documents"][0][0], results["distances"][0][0] + input_text_2, output_text = self.uid_text_dict[uid] + assert input_text == input_text_2 + if self.verbosity >= 1: + print( + colored( + f"\nINPUT-OUTPUT PAIR RETRIEVED FROM VECTOR DATABASE:\n INPUT1\n {input_text}\n OUTPUT\n {output_text}\n DISTANCE\n {distance}", + "light_yellow", + ) + ) + return input_text, output_text, distance + + def get_related_memos(self, query_text: str, n_results: int, threshold: Union[int, float]): + """Retrieves memos that are related to the given query text within the specified distance threshold.""" + if n_results > len(self.uid_text_dict): + n_results = len(self.uid_text_dict) + results = self.vec_db.query(query_texts=[query_text], n_results=n_results) + memos = [] + num_results = len(results["ids"][0]) + for i in range(num_results): + uid, input_text, distance = results["ids"][0][i], results["documents"][0][i], results["distances"][0][i] + if distance < threshold: + input_text_2, output_text = self.uid_text_dict[uid] + assert input_text == input_text_2 + if self.verbosity >= 1: + print( + colored( + f"\nINPUT-OUTPUT PAIR RETRIEVED FROM VECTOR DATABASE:\n INPUT1\n {input_text}\n OUTPUT\n {output_text}\n DISTANCE\n {distance}", + "light_yellow", + ) + ) + memos.append((input_text, output_text, distance)) + return memos + + def prepopulate(self): + """Adds a few arbitrary examples to the vector DB, just to make retrieval less trivial.""" + if self.verbosity 
>= 1: + print(colored("\nPREPOPULATING MEMORY", "light_green")) + examples = [] + examples.append({"text": "When I say papers I mean research papers, which are typically pdfs.", "label": "yes"}) + examples.append({"text": "Please verify that each paper you listed actually uses langchain.", "label": "no"}) + examples.append({"text": "Tell gpt the output should still be latex code.", "label": "no"}) + examples.append({"text": "Hint: convert pdfs to text and then answer questions based on them.", "label": "yes"}) + examples.append({ + "text": "To create a good PPT, include enough content to make it interesting.", + "label": "yes", + }) + examples.append({ + "text": "No, for this case the columns should be aspects and the rows should be frameworks.", + "label": "no", + }) + examples.append({"text": "When writing code, remember to include any libraries that are used.", "label": "yes"}) + examples.append({"text": "Please summarize the papers by Eric Horvitz on bounded rationality.", "label": "no"}) + examples.append({"text": "Compare the h-index of Daniel Weld and Oren Etzioni.", "label": "no"}) + examples.append({ + "text": "Double check to be sure that the columns in a table correspond to what was asked for.", + "label": "yes", + }) + for example in examples: + self.add_input_output_pair(example["text"], example["label"]) + self._save_memos() diff --git a/mm_agents/coact/autogen/agentchat/contrib/capabilities/text_compressors.py b/mm_agents/coact/autogen/agentchat/contrib/capabilities/text_compressors.py new file mode 100644 index 0000000..ef4b6ef --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/contrib/capabilities/text_compressors.py @@ -0,0 +1,66 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +from typing import Any, Protocol + +from ....import_utils import optional_import_block, require_optional_import + +with optional_import_block() as result: + import llmlingua + from llmlingua import PromptCompressor + + +class TextCompressor(Protocol): + """Defines a protocol for text compression to optimize agent interactions.""" + + def compress_text(self, text: str, **compression_params) -> dict[str, Any]: + """This method takes a string as input and returns a dictionary containing the compressed text and other + relevant information. The compressed text should be stored under the 'compressed_text' key in the dictionary. + To calculate the number of saved tokens, the dictionary should include 'origin_tokens' and 'compressed_tokens' keys. + """ + ... + + +@require_optional_import("llmlingua", "long-context") +class LLMLingua: + """Compresses text messages using LLMLingua for improved efficiency in processing and response generation. + + NOTE: The effectiveness of compression and the resultant token savings can vary based on the content of the messages + and the specific configurations used for the PromptCompressor. + """ + + def __init__( + self, + prompt_compressor_kwargs: dict = dict( + model_name="microsoft/llmlingua-2-bert-base-multilingual-cased-meetingbank", + use_llmlingua2=True, + device_map="cpu", + ), + structured_compression: bool = False, + ) -> None: + """Args: + prompt_compressor_kwargs (dict): A dictionary of keyword arguments for the PromptCompressor. 
Defaults to a + dictionary with model_name set to "microsoft/llmlingua-2-bert-base-multilingual-cased-meetingbank", + use_llmlingua2 set to True, and device_map set to "cpu". + structured_compression (bool): A flag indicating whether to use structured compression. If True, the + structured_compress_prompt method of the PromptCompressor is used. Otherwise, the compress_prompt method + is used. Defaults to False. + dictionary. + + Raises: + ImportError: If the llmlingua library is not installed. + """ + self._prompt_compressor = PromptCompressor(**prompt_compressor_kwargs) + + assert isinstance(self._prompt_compressor, llmlingua.PromptCompressor) + self._compression_method = ( + self._prompt_compressor.structured_compress_prompt + if structured_compression + else self._prompt_compressor.compress_prompt + ) + + def compress_text(self, text: str, **compression_params) -> dict[str, Any]: + return self._compression_method([text], **compression_params) diff --git a/mm_agents/coact/autogen/agentchat/contrib/capabilities/tools_capability.py b/mm_agents/coact/autogen/agentchat/contrib/capabilities/tools_capability.py new file mode 100644 index 0000000..bd69396 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/contrib/capabilities/tools_capability.py @@ -0,0 +1,22 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from ....agentchat import ConversableAgent +from ....tools import Tool + + +class ToolsCapability: + """Adding a list of tools as composable capabilities to a single agent. + This class can be inherited from to allow code to run at the point of creating or adding the capability. + + Note: both caller and executor of the tools are the same agent. + """ + + def __init__(self, tool_list: list[Tool]): + self.tools = [tool for tool in tool_list] + + def add_to_agent(self, agent: ConversableAgent): + """Add tools to the given agent.""" + for tool in self.tools: + tool.register_tool(agent=agent) diff --git a/mm_agents/coact/autogen/agentchat/contrib/capabilities/transform_messages.py b/mm_agents/coact/autogen/agentchat/contrib/capabilities/transform_messages.py new file mode 100644 index 0000000..ad6c537 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/contrib/capabilities/transform_messages.py @@ -0,0 +1,93 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +import copy +from typing import TYPE_CHECKING, Any + +from ....formatting_utils import colored +from .transforms import MessageTransform + +if TYPE_CHECKING: + from ...conversable_agent import ConversableAgent + + +class TransformMessages: + """Agent capability for transforming messages before reply generation. + + This capability allows you to apply a series of message transformations to + a ConversableAgent's incoming messages before they are processed for response + generation. This is useful for tasks such as: + + - Limiting the number of messages considered for context. + - Truncating messages to meet token limits. + - Filtering sensitive information. + - Customizing message formatting. + + To use `TransformMessages`: + + 1. Create message transformations (e.g., `MessageHistoryLimiter`, `MessageTokenLimiter`). + 2. Instantiate `TransformMessages` with a list of these transformations. + 3. 
Add the `TransformMessages` instance to your `ConversableAgent` using `add_to_agent`. + + NOTE: Order of message transformations is important. You could get different results based on + the order of transformations. + + Example: + ```python + from agentchat import ConversableAgent + from agentchat.contrib.capabilities import TransformMessages, MessageHistoryLimiter, MessageTokenLimiter + + max_messages = MessageHistoryLimiter(max_messages=2) + truncate_messages = MessageTokenLimiter(max_tokens=500) + transform_messages = TransformMessages(transforms=[max_messages, truncate_messages]) + + agent = ConversableAgent(...) + transform_messages.add_to_agent(agent) + ``` + """ + + def __init__(self, *, transforms: list[MessageTransform] = [], verbose: bool = True): + """Args: + transforms: A list of message transformations to apply. + verbose: Whether to print logs of each transformation or not. + """ + self._transforms = transforms + self._verbose = verbose + + def add_to_agent(self, agent: "ConversableAgent"): + """Adds the message transformations capability to the specified ConversableAgent. + + This function performs the following modifications to the agent: + + 1. Registers a hook that automatically transforms all messages before they are processed for + response generation. + """ + agent.register_hook(hookable_method="process_all_messages_before_reply", hook=self._transform_messages) + + def _transform_messages(self, messages: list[dict[str, Any]]) -> list[dict[str, Any]]: + post_transform_messages = copy.deepcopy(messages) + system_message = None + + if messages[0]["role"] == "system": + system_message = copy.deepcopy(messages[0]) + post_transform_messages.pop(0) + + for transform in self._transforms: + # deepcopy in case pre_transform_messages will later be used for logs printing + pre_transform_messages = ( + copy.deepcopy(post_transform_messages) if self._verbose else post_transform_messages + ) + post_transform_messages = transform.apply_transform(pre_transform_messages) + + if self._verbose: + logs_str, had_effect = transform.get_logs(pre_transform_messages, post_transform_messages) + if had_effect: + print(colored(logs_str, "yellow")) + + if system_message: + post_transform_messages.insert(0, system_message) + + return post_transform_messages diff --git a/mm_agents/coact/autogen/agentchat/contrib/capabilities/transforms.py b/mm_agents/coact/autogen/agentchat/contrib/capabilities/transforms.py new file mode 100644 index 0000000..cedb1cb --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/contrib/capabilities/transforms.py @@ -0,0 +1,579 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +import copy +import sys +from typing import Any, Optional, Protocol, Union + +import tiktoken +from termcolor import colored + +from .... import token_count_utils +from ....cache import AbstractCache, Cache +from ....types import MessageContentType +from . import transforms_util +from .text_compressors import LLMLingua, TextCompressor + + +class MessageTransform(Protocol): + """Defines a contract for message transformation. + + Classes implementing this protocol should provide an `apply_transform` method + that takes a list of messages and returns the transformed list. 
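+
+    A minimal conforming implementation (hypothetical, for illustration) might look like:
+
+    ```python
+    class DropSystemMessages:
+        def apply_transform(self, messages):
+            return [msg for msg in messages if msg.get("role") != "system"]
+
+        def get_logs(self, pre_transform_messages, post_transform_messages):
+            removed = len(pre_transform_messages) - len(post_transform_messages)
+            return f"Removed {removed} system message(s).", removed > 0
+    ```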
+ """ + + def apply_transform(self, messages: list[dict[str, Any]]) -> list[dict[str, Any]]: + """Applies a transformation to a list of messages. + + Args: + messages: A list of dictionaries representing messages. + + Returns: + A new list of dictionaries containing the transformed messages. + """ + ... + + def get_logs( + self, pre_transform_messages: list[dict[str, Any]], post_transform_messages: list[dict[str, Any]] + ) -> tuple[str, bool]: + """Creates the string including the logs of the transformation + + Alongside the string, it returns a boolean indicating whether the transformation had an effect or not. + + Args: + pre_transform_messages: A list of dictionaries representing messages before the transformation. + post_transform_messages: A list of dictionaries representig messages after the transformation. + + Returns: + A tuple with a string with the logs and a flag indicating whether the transformation had an effect or not. + """ + ... + + +class MessageHistoryLimiter: + """Limits the number of messages considered by an agent for response generation. + + This transform keeps only the most recent messages up to the specified maximum number of messages (max_messages). + It trims the conversation history by removing older messages, retaining only the most recent messages. + """ + + def __init__( + self, + max_messages: Optional[int] = None, + keep_first_message: bool = False, + exclude_names: Optional[list[str]] = None, + ): + """Args: + max_messages Optional[int]: Maximum number of messages to keep in the context. Must be greater than 0 if not None. + keep_first_message bool: Whether to keep the original first message in the conversation history. + Defaults to False. + exclude_names Optional[list[str]]: List of message sender names to exclude from the message history. + Messages from these senders will be filtered out before applying the message limit. Defaults to None. + """ + self._validate_max_messages(max_messages) + self._max_messages = max_messages + self._keep_first_message = keep_first_message + self._exclude_names = exclude_names + + def apply_transform(self, messages: list[dict[str, Any]]) -> list[dict[str, Any]]: + """Truncates the conversation history to the specified maximum number of messages. + + This method returns a new list containing the most recent messages up to the specified + maximum number of messages (max_messages). If max_messages is None, it returns the + original list of messages unmodified. + + Args: + messages (List[Dict]): The list of messages representing the conversation history. + + Returns: + List[Dict]: A new list containing the most recent messages up to the specified maximum. + """ + + exclude_names = getattr(self, "_exclude_names", None) + + filtered = [msg for msg in messages if msg.get("name") not in exclude_names] if exclude_names else messages + + if self._max_messages is None or len(filtered) <= self._max_messages: + return filtered + + truncated_messages = [] + remaining_count = self._max_messages + + # Start with the first message if we need to keep it + if self._keep_first_message and filtered: + truncated_messages = [filtered[0]] + remaining_count -= 1 + + # Loop through messages in reverse + for i in range(len(filtered) - 1, 0, -1): + if remaining_count > 1: + truncated_messages.insert(1 if self._keep_first_message else 0, filtered[i]) + if remaining_count == 1: # noqa: SIM102 + # If there's only 1 slot left and it's a 'tools' message, ignore it. 
+ if filtered[i].get("role") != "tool": + truncated_messages.insert(1, filtered[i]) + + remaining_count -= 1 + if remaining_count == 0: + break + + return truncated_messages + + def get_logs( + self, pre_transform_messages: list[dict[str, Any]], post_transform_messages: list[dict[str, Any]] + ) -> tuple[str, bool]: + pre_transform_messages_len = len(pre_transform_messages) + post_transform_messages_len = len(post_transform_messages) + + if post_transform_messages_len < pre_transform_messages_len: + logs_str = ( + f"Removed {pre_transform_messages_len - post_transform_messages_len} messages. " + f"Number of messages reduced from {pre_transform_messages_len} to {post_transform_messages_len}." + ) + return logs_str, True + return "No messages were removed.", False + + def _validate_max_messages(self, max_messages: Optional[int]): + if max_messages is not None and max_messages < 1: + raise ValueError("max_messages must be None or greater than 1") + + +class MessageTokenLimiter: + """Truncates messages to meet token limits for efficient processing and response generation. + + This transformation applies two levels of truncation to the conversation history: + + 1. Truncates each individual message to the maximum number of tokens specified by max_tokens_per_message. + 2. Truncates the overall conversation history to the maximum number of tokens specified by max_tokens. + + NOTE: Tokens are counted using the encoder for the specified model. Different models may yield different token + counts for the same text. + + NOTE: For multimodal LLMs, the token count may be inaccurate as it does not account for the non-text input + (e.g images). + + The truncation process follows these steps in order: + + 1. The minimum tokens threshold (`min_tokens`) is checked (0 by default). If the total number of tokens in messages + is less than this threshold, then the messages are returned as is. In other case, the following process is applied. + 2. Messages are processed in reverse order (newest to oldest). + 3. Individual messages are truncated based on max_tokens_per_message. For multimodal messages containing both text + and other types of content, only the text content is truncated. + 4. The overall conversation history is truncated based on the max_tokens limit. Once the accumulated token count + exceeds this limit, the current message being processed get truncated to meet the total token count and any + remaining messages get discarded. + 5. The truncated conversation history is reconstructed by prepending the messages to a new list to preserve the + original message order. + """ + + def __init__( + self, + max_tokens_per_message: Optional[int] = None, + max_tokens: Optional[int] = None, + min_tokens: Optional[int] = None, + model: str = "gpt-3.5-turbo-0613", + filter_dict: Optional[dict[str, Any]] = None, + exclude_filter: bool = True, + ): + """Args: + max_tokens_per_message (None or int): Maximum number of tokens to keep in each message. + Must be greater than or equal to 0 if not None. + max_tokens (Optional[int]): Maximum number of tokens to keep in the chat history. + Must be greater than or equal to 0 if not None. + min_tokens (Optional[int]): Minimum number of tokens in messages to apply the transformation. + Must be greater than or equal to 0 if not None. + model (str): The target OpenAI model for tokenization alignment. + filter_dict (None or dict): A dictionary to filter out messages that you want/don't want to compress. + If None, no filters will be applied. 
+ exclude_filter (bool): If exclude filter is True (the default value), messages that match the filter will be + excluded from token truncation. If False, messages that match the filter will be truncated. + """ + self._model = model + self._max_tokens_per_message = self._validate_max_tokens(max_tokens_per_message) + self._max_tokens = self._validate_max_tokens(max_tokens) + self._min_tokens = self._validate_min_tokens(min_tokens, max_tokens) + self._filter_dict = filter_dict + self._exclude_filter = exclude_filter + + def apply_transform(self, messages: list[dict[str, Any]]) -> list[dict[str, Any]]: + """Applies token truncation to the conversation history. + + Args: + messages (List[Dict]): The list of messages representing the conversation history. + + Returns: + List[Dict]: A new list containing the truncated messages up to the specified token limits. + """ + assert self._max_tokens_per_message is not None + assert self._max_tokens is not None + assert self._min_tokens is not None + + # if the total number of tokens in the messages is less than the min_tokens, return the messages as is + if not transforms_util.min_tokens_reached(messages, self._min_tokens): + return messages + + temp_messages = copy.deepcopy(messages) + processed_messages = [] + processed_messages_tokens = 0 + + for msg in reversed(temp_messages): + # Some messages may not have content. + if not transforms_util.is_content_right_type(msg.get("content")): + processed_messages.insert(0, msg) + continue + + if not transforms_util.should_transform_message(msg, self._filter_dict, self._exclude_filter): + processed_messages.insert(0, msg) + processed_messages_tokens += transforms_util.count_text_tokens(msg["content"]) + continue + + expected_tokens_remained = self._max_tokens - processed_messages_tokens - self._max_tokens_per_message + + # If adding this message would exceed the token limit, truncate the last message to meet the total token + # limit and discard all remaining messages + if expected_tokens_remained < 0: + msg["content"] = self._truncate_str_to_tokens( + msg["content"], self._max_tokens - processed_messages_tokens + ) + processed_messages.insert(0, msg) + break + + msg["content"] = self._truncate_str_to_tokens(msg["content"], self._max_tokens_per_message) + msg_tokens = transforms_util.count_text_tokens(msg["content"]) + + # prepend the message to the list to preserve order + processed_messages_tokens += msg_tokens + processed_messages.insert(0, msg) + + return processed_messages + + def get_logs( + self, pre_transform_messages: list[dict[str, Any]], post_transform_messages: list[dict[str, Any]] + ) -> tuple[str, bool]: + pre_transform_messages_tokens = sum( + transforms_util.count_text_tokens(msg["content"]) for msg in pre_transform_messages if "content" in msg + ) + post_transform_messages_tokens = sum( + transforms_util.count_text_tokens(msg["content"]) for msg in post_transform_messages if "content" in msg + ) + + if post_transform_messages_tokens < pre_transform_messages_tokens: + logs_str = ( + f"Truncated {pre_transform_messages_tokens - post_transform_messages_tokens} tokens. 
" + f"Number of tokens reduced from {pre_transform_messages_tokens} to {post_transform_messages_tokens}" + ) + return logs_str, True + return "No tokens were truncated.", False + + def _truncate_str_to_tokens(self, contents: Union[str, list], n_tokens: int) -> Union[str, list]: + if isinstance(contents, str): + return self._truncate_tokens(contents, n_tokens) + elif isinstance(contents, list): + return self._truncate_multimodal_text(contents, n_tokens) + else: + raise ValueError(f"Contents must be a string or a list of dictionaries. Received type: {type(contents)}") + + def _truncate_multimodal_text(self, contents: list[dict[str, Any]], n_tokens: int) -> list[dict[str, Any]]: + """Truncates text content within a list of multimodal elements, preserving the overall structure.""" + tmp_contents = [] + for content in contents: + if content["type"] == "text": + truncated_text = self._truncate_tokens(content["text"], n_tokens) + tmp_contents.append({"type": "text", "text": truncated_text}) + else: + tmp_contents.append(content) + return tmp_contents + + def _truncate_tokens(self, text: str, n_tokens: int) -> str: + encoding = tiktoken.encoding_for_model(self._model) # Get the appropriate tokenizer + + encoded_tokens = encoding.encode(text) + truncated_tokens = encoded_tokens[:n_tokens] + truncated_text = encoding.decode(truncated_tokens) # Decode back to text + + return truncated_text + + def _validate_max_tokens(self, max_tokens: Optional[int] = None) -> Optional[int]: + if max_tokens is not None and max_tokens < 0: + raise ValueError("max_tokens and max_tokens_per_message must be None or greater than or equal to 0") + + try: + allowed_tokens = token_count_utils.get_max_token_limit(self._model) + except Exception: + print(colored(f"Model {self._model} not found in token_count_utils.", "yellow")) + allowed_tokens = None + + if max_tokens is not None and allowed_tokens is not None and max_tokens > allowed_tokens: + print( + colored( + f"Max token was set to {max_tokens}, but {self._model} can only accept {allowed_tokens} tokens. Capping it to {allowed_tokens}.", + "yellow", + ) + ) + return allowed_tokens + + return max_tokens if max_tokens is not None else sys.maxsize + + def _validate_min_tokens(self, min_tokens: Optional[int], max_tokens: Optional[int]) -> int: + if min_tokens is None: + return 0 + if min_tokens < 0: + raise ValueError("min_tokens must be None or greater than or equal to 0.") + if max_tokens is not None and min_tokens > max_tokens: + raise ValueError("min_tokens must not be more than max_tokens.") + return min_tokens + + +class TextMessageCompressor: + """A transform for compressing text messages in a conversation history. + + It uses a specified text compression method to reduce the token count of messages, which can lead to more efficient + processing and response generation by downstream models. + """ + + def __init__( + self, + text_compressor: Optional[TextCompressor] = None, + min_tokens: Optional[int] = None, + compression_params: dict = dict(), + cache: Optional[AbstractCache] = None, + filter_dict: Optional[dict[str, Any]] = None, + exclude_filter: bool = True, + ): + """Args: + text_compressor (TextCompressor or None): An instance of a class that implements the TextCompressor + protocol. If None, it defaults to LLMLingua. + min_tokens (int or None): Minimum number of tokens in messages to apply the transformation. Must be greater + than or equal to 0 if not None. If None, no threshold-based compression is applied. 
+            compression_params (dict): A dictionary of arguments for the compression method. Defaults to an empty
+                dictionary.
+            cache (None or AbstractCache): The cache client to use to store and retrieve previously compressed messages.
+                If None, no caching will be used.
+            filter_dict (None or dict): A dictionary to filter out messages that you want/don't want to compress.
+                If None, no filters will be applied.
+            exclude_filter (bool): If exclude filter is True (the default value), messages that match the filter will be
+                excluded from compression. If False, messages that match the filter will be compressed.
+        """
+        if text_compressor is None:
+            text_compressor = LLMLingua()
+
+        self._validate_min_tokens(min_tokens)
+
+        self._text_compressor = text_compressor
+        self._min_tokens = min_tokens
+        self._compression_args = compression_params
+        self._filter_dict = filter_dict
+        self._exclude_filter = exclude_filter
+
+        if cache is None:
+            self._cache = Cache.disk()
+        else:
+            self._cache = cache
+
+        # Track token savings from the most recent transform to simplify log generation
+        self._recent_tokens_savings = 0
+
+    def apply_transform(self, messages: list[dict[str, Any]]) -> list[dict[str, Any]]:
+        """Applies compression to messages in a conversation history based on the specified configuration.
+
+        The function processes each message according to the `compression_params` and `min_tokens` settings, applying
+        the specified compression configuration and returning a new list of messages with reduced token counts
+        where possible.
+
+        Args:
+            messages (List[Dict]): A list of message dictionaries to be compressed.
+
+        Returns:
+            List[Dict]: A list of dictionaries with the message content compressed according to the configured
+                method and scope.
+        """
+        # Make sure there is at least one message
+        if not messages:
+            return messages
+
+        # if the total number of tokens in the messages is less than the min_tokens, return the messages as is
+        if not transforms_util.min_tokens_reached(messages, self._min_tokens):
+            return messages
+
+        total_savings = 0
+        processed_messages = messages.copy()
+        for message in processed_messages:
+            # Some messages may not have content.
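+            # Filtered-out and text-empty messages are skipped as well; for the remaining messages a cached
+            # compression result is reused when available before calling the text compressor.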
+ if not transforms_util.is_content_right_type(message.get("content")): + continue + + if not transforms_util.should_transform_message(message, self._filter_dict, self._exclude_filter): + continue + + if transforms_util.is_content_text_empty(message["content"]): + continue + + cache_key = transforms_util.cache_key(message["content"], self._min_tokens) + cached_content = transforms_util.cache_content_get(self._cache, cache_key) + if cached_content is not None: + message["content"], savings = cached_content + else: + message["content"], savings = self._compress(message["content"]) + + transforms_util.cache_content_set(self._cache, cache_key, message["content"], savings) + + assert isinstance(savings, int) + total_savings += savings + + self._recent_tokens_savings = total_savings + return processed_messages + + def get_logs( + self, pre_transform_messages: list[dict[str, Any]], post_transform_messages: list[dict[str, Any]] + ) -> tuple[str, bool]: + if self._recent_tokens_savings > 0: + return f"{self._recent_tokens_savings} tokens saved with text compression.", True + else: + return "No tokens saved with text compression.", False + + def _compress(self, content: MessageContentType) -> tuple[MessageContentType, int]: + """Compresses the given text or multimodal content using the specified compression method.""" + if isinstance(content, str): + return self._compress_text(content) + elif isinstance(content, list): + return self._compress_multimodal(content) + else: + return content, 0 + + def _compress_multimodal(self, content: MessageContentType) -> tuple[MessageContentType, int]: + tokens_saved = 0 + for item in content: + if isinstance(item, dict) and "text" in item: + item["text"], savings = self._compress_text(item["text"]) + tokens_saved += savings + + elif isinstance(item, str): + item, savings = self._compress_text(item) + tokens_saved += savings + + return content, tokens_saved + + def _compress_text(self, text: str) -> tuple[str, int]: + """Compresses the given text using the specified compression method.""" + compressed_text = self._text_compressor.compress_text(text, **self._compression_args) + + savings = 0 + if "origin_tokens" in compressed_text and "compressed_tokens" in compressed_text: + savings = compressed_text["origin_tokens"] - compressed_text["compressed_tokens"] + + return compressed_text["compressed_prompt"], savings + + def _validate_min_tokens(self, min_tokens: Optional[int]): + if min_tokens is not None and min_tokens <= 0: + raise ValueError("min_tokens must be greater than 0 or None") + + +class TextMessageContentName: + """A transform for including the agent's name in the content of a message. + + How to create and apply the transform: + # Imports + from autogen.agentchat.contrib.capabilities import transform_messages, transforms + + # Create Transform + name_transform = transforms.TextMessageContentName(position="start", format_string="'{name}' said:\n") + + # Create the TransformMessages + context_handling = transform_messages.TransformMessages( + transforms=[ + name_transform + ] + ) + + # Add it to an agent so when they run inference it will apply to the messages + context_handling.add_to_agent(my_agent) + """ + + def __init__( + self, + position: str = "start", + format_string: str = "{name}:\n", + deduplicate: bool = True, + filter_dict: Optional[dict[str, Any]] = None, + exclude_filter: bool = True, + ): + """Args: + position (str): The position to add the name to the content. The possible options are 'start' or 'end'. Defaults to 'start'. 
+ format_string (str): The f-string to format the message name with. Use '{name}' as a placeholder for the agent's name. Defaults to '{name}:\n' and must contain '{name}'. + deduplicate (bool): Whether to deduplicate the formatted string so it doesn't appear twice (sometimes the LLM will add it to new messages itself). Defaults to True. + filter_dict (None or dict): A dictionary to filter out messages that you want/don't want to compress. + If None, no filters will be applied. + exclude_filter (bool): If exclude filter is True (the default value), messages that match the filter will be + excluded from compression. If False, messages that match the filter will be compressed. + """ + assert isinstance(position, str) and position in ["start", "end"] + assert isinstance(format_string, str) and "{name}" in format_string + assert isinstance(deduplicate, bool) and deduplicate is not None + + self._position = position + self._format_string = format_string + self._deduplicate = deduplicate + self._filter_dict = filter_dict + self._exclude_filter = exclude_filter + + # Track the number of messages changed for logging + self._messages_changed = 0 + + def apply_transform(self, messages: list[dict[str, Any]]) -> list[dict[str, Any]]: + """Applies the name change to the message based on the position and format string. + + Args: + messages (List[Dict]): A list of message dictionaries. + + Returns: + List[Dict]: A list of dictionaries with the message content updated with names. + """ + # Make sure there is at least one message + if not messages: + return messages + + messages_changed = 0 + processed_messages = copy.deepcopy(messages) + for message in processed_messages: + # Some messages may not have content. + if not transforms_util.is_content_right_type( + message.get("content") + ) or not transforms_util.is_content_right_type(message.get("name")): + continue + + if not transforms_util.should_transform_message(message, self._filter_dict, self._exclude_filter): + continue + + if transforms_util.is_content_text_empty(message["content"]) or transforms_util.is_content_text_empty( + message["name"] + ): + continue + + # Get and format the name in the content + content = message["content"] + formatted_name = self._format_string.format(name=message["name"]) + + if self._position == "start": + if not self._deduplicate or not content.startswith(formatted_name): + message["content"] = f"{formatted_name}{content}" + + messages_changed += 1 + else: + if not self._deduplicate or not content.endswith(formatted_name): + message["content"] = f"{content}{formatted_name}" + + messages_changed += 1 + + self._messages_changed = messages_changed + return processed_messages + + def get_logs( + self, pre_transform_messages: list[dict[str, Any]], post_transform_messages: list[dict[str, Any]] + ) -> tuple[str, bool]: + if self._messages_changed > 0: + return f"{self._messages_changed} message(s) changed to incorporate name.", True + else: + return "No messages changed to incorporate name.", False diff --git a/mm_agents/coact/autogen/agentchat/contrib/capabilities/transforms_util.py b/mm_agents/coact/autogen/agentchat/contrib/capabilities/transforms_util.py new file mode 100644 index 0000000..0aa73c1 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/contrib/capabilities/transforms_util.py @@ -0,0 +1,122 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under 
the MIT License. +# SPDX-License-Identifier: MIT +from collections.abc import Hashable +from typing import Any, Optional + +from .... import token_count_utils +from ....cache.abstract_cache_base import AbstractCache +from ....oai.openai_utils import filter_config +from ....types import MessageContentType + + +def cache_key(content: MessageContentType, *args: Hashable) -> str: + """Calculates the cache key for the given message content and any other hashable args. + + Args: + content (MessageContentType): The message content to calculate the cache key for. + *args: Any additional hashable args to include in the cache key. + """ + str_keys = [str(key) for key in (content, *args)] + return "".join(str_keys) + + +def cache_content_get(cache: Optional[AbstractCache], key: str) -> Optional[tuple[MessageContentType, ...]]: + """Retrieves cached content from the cache. + + Args: + cache (None or AbstractCache): The cache to retrieve the content from. If None, the cache is ignored. + key (str): The key to retrieve the content from. + """ + if cache: + cached_value = cache.get(key) + if cached_value: + return cached_value + + +def cache_content_set(cache: Optional[AbstractCache], key: str, content: MessageContentType, *extra_values): + """Sets content into the cache. + + Args: + cache (None or AbstractCache): The cache to set the content into. If None, the cache is ignored. + key (str): The key to set the content into. + content (MessageContentType): The message content to set into the cache. + *extra_values: Additional values to be passed to the cache. + """ + if cache: + cache_value = (content, *extra_values) + cache.set(key, cache_value) + + +def min_tokens_reached(messages: list[dict[str, Any]], min_tokens: Optional[int]) -> bool: + """Returns True if the total number of tokens in the messages is greater than or equal to the specified value. + + Args: + messages (List[Dict]): A list of messages to check. + min_tokens (None or int): The minimum number of tokens to check for. + """ + if not min_tokens: + return True + + messages_tokens = sum(count_text_tokens(msg["content"]) for msg in messages if "content" in msg) + return messages_tokens >= min_tokens + + +def count_text_tokens(content: MessageContentType) -> int: + """Calculates the number of text tokens in the given message content. + + Args: + content (MessageContentType): The message content to calculate the number of text tokens for. + """ + token_count = 0 + if isinstance(content, str): + token_count = token_count_utils.count_token(content) + elif isinstance(content, list): + for item in content: + if isinstance(item, str): + token_count += token_count_utils.count_token(item) + else: + token_count += count_text_tokens(item.get("text", "")) + return token_count + + +def is_content_right_type(content: Any) -> bool: + """A helper function to check if the passed in content is of the right type.""" + return isinstance(content, (str, list)) + + +def is_content_text_empty(content: MessageContentType) -> bool: + """Checks if the content of the message does not contain any text. + + Args: + content (MessageContentType): The message content to check. 
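+
+    For example, "" and a list containing only image items are treated as empty, while any
+    non-empty string or text item makes the content non-empty.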
+ """ + if isinstance(content, str): + return content == "" + elif isinstance(content, list): + texts = [] + for item in content: + if isinstance(item, str): + texts.append(item) + elif isinstance(item, dict): + texts.append(item.get("text", "")) + return not any(texts) + else: + return True + + +def should_transform_message(message: dict[str, Any], filter_dict: Optional[dict[str, Any]], exclude: bool) -> bool: + """Validates whether the transform should be applied according to the filter dictionary. + + Args: + message (Dict[str, Any]): The message to validate. + filter_dict (None or Dict[str, Any]): The filter dictionary to validate against. If None, the transform is always applied. + exclude (bool): Whether to exclude messages that match the filter dictionary. + """ + if not filter_dict: + return True + + return len(filter_config([message], filter_dict, exclude)) > 0 diff --git a/mm_agents/coact/autogen/agentchat/contrib/capabilities/vision_capability.py b/mm_agents/coact/autogen/agentchat/contrib/capabilities/vision_capability.py new file mode 100644 index 0000000..a0035c8 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/contrib/capabilities/vision_capability.py @@ -0,0 +1,212 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +import copy +from typing import Any, Callable, Optional, Union + +from ....code_utils import content_str +from ....oai.client import OpenAIWrapper +from ...assistant_agent import ConversableAgent +from ..img_utils import ( + convert_base64_to_data_uri, + get_image_data, + get_pil_image, + gpt4v_formatter, +) +from .agent_capability import AgentCapability + +DEFAULT_DESCRIPTION_PROMPT = ( + "Write a detailed caption for this image. " + "Pay special attention to any details that might be useful or relevant " + "to the ongoing conversation." +) + + +class VisionCapability(AgentCapability): + """We can add vision capability to regular ConversableAgent, even if the agent does not have the multimodal capability, + such as GPT-3.5-turbo agent, Llama, Orca, or Mistral agents. This vision capability will invoke a LMM client to describe + the image (captioning) before sending the information to the agent's actual client. + + The vision capability will hook to the ConversableAgent's `process_last_received_message`. + + Some technical details: + When the agent (who has the vision capability) received an message, it will: + 1. _process_received_message: + a. _append_oai_message + 2. generate_reply: if the agent is a MultimodalAgent, it will also use the image tag. + a. hook process_last_received_message (NOTE: this is where the vision capability will be hooked to.) + b. hook process_all_messages_before_reply + 3. send: + a. hook process_message_before_send + b. _append_oai_message + """ + + def __init__( + self, + lmm_config: dict[str, Any], + description_prompt: Optional[str] = DEFAULT_DESCRIPTION_PROMPT, + custom_caption_func: Callable = None, + ) -> None: + """Initializes a new instance, setting up the configuration for interacting with + a Language Multimodal (LMM) client and specifying optional parameters for image + description and captioning. + + Args: + lmm_config (Dict): Configuration for the LMM client, which is used to call + the LMM service for describing the image. 
This must be a dictionary containing + the necessary configuration parameters. If `lmm_config` is False or an empty dictionary, + it is considered invalid, and initialization will assert. + description_prompt (Optional[str], optional): The prompt to use for generating + descriptions of the image. This parameter allows customization of the + prompt passed to the LMM service. Defaults to `DEFAULT_DESCRIPTION_PROMPT` if not provided. + custom_caption_func (Callable, optional): A callable that, if provided, will be used + to generate captions for images. This allows for custom captioning logic outside + of the standard LMM service interaction. + The callable should take three parameters as input: + 1. an image URL (or local location) + 2. image_data (a PIL image) + 3. lmm_client (to call remote LMM) + and then return a description (as string). + If not provided, captioning will rely on the LMM client configured via `lmm_config`. + If provided, we will not run the default self._get_image_caption method. + + Raises: + AssertionError: If neither a valid `lmm_config` nor a `custom_caption_func` is provided, + an AssertionError is raised to indicate that the Vision Capability requires + one of these to be valid for operation. + """ + self._lmm_config = lmm_config + self._description_prompt = description_prompt + self._parent_agent = None + + if lmm_config: + self._lmm_client = OpenAIWrapper(**lmm_config) + else: + self._lmm_client = None + + self._custom_caption_func = custom_caption_func + assert self._lmm_config or custom_caption_func, ( + "Vision Capability requires a valid lmm_config or custom_caption_func." + ) + + def add_to_agent(self, agent: ConversableAgent) -> None: + self._parent_agent = agent + + # Append extra info to the system message. + agent.update_system_message(agent.system_message + "\nYou've been given the ability to interpret images.") + + # Register a hook for processing the last message. + agent.register_hook(hookable_method="process_last_received_message", hook=self.process_last_received_message) + + def process_last_received_message(self, content: Union[str, list[dict[str, Any]]]) -> str: + """Processes the last received message content by normalizing and augmenting it + with descriptions of any included images. The function supports input content + as either a string or a list of dictionaries, where each dictionary represents + a content item (e.g., text, image). If the content contains image URLs, it + fetches the image data, generates a caption for each image, and inserts the + caption into the augmented content. + + The function aims to transform the content into a format compatible with GPT-4V + multimodal inputs, specifically by formatting strings into PIL-compatible + images if needed and appending text descriptions for images. This allows for + a more accessible presentation of the content, especially in contexts where + images cannot be displayed directly. + + Args: + content (Union[str, List[dict[str, Any]]]): The last received message content, which + can be a plain text string or a list of dictionaries representing + different types of content items (e.g., text, image_url). + + Returns: + str: The augmented message content + + Raises: + AssertionError: If an item in the content list is not a dictionary. + + Examples: + Assuming `self._get_image_caption(img_data)` returns + "A beautiful sunset over the mountains" for the image. + + - Input as String: + content = "Check out this cool photo!" + Output: "Check out this cool photo!" 
+ (Content is a string without an image, remains unchanged.) + + - Input as String, with image location: + content = "What's weather in this cool photo: ``" + Output: "What's weather in this cool photo: `` in case you can not see, the caption of this image is: + A beautiful sunset over the mountains\n" + (Caption added after the image) + + - Input as List with Text Only: + content = `[{"type": "text", "text": "Here's an interesting fact."}]` + Output: "Here's an interesting fact." + (No images in the content, it remains unchanged.) + + - Input as List with Image URL: + ```python + content = [ + {"type": "text", "text": "What's weather in this cool photo:"}, + {"type": "image_url", "image_url": "http://example.com/photo.jpg"}, + ] + ``` + Output: "What's weather in this cool photo: `` in case you can not see, the caption of this image is: + A beautiful sunset over the mountains\n" + (Caption added after the image) + """ + copy.deepcopy(content) + # normalize the content into the gpt-4v format for multimodal + # we want to keep the URL format to keep it concise. + if isinstance(content, str): + content = gpt4v_formatter(content, img_format="url") + + aug_content: str = "" + for item in content: + assert isinstance(item, dict) + if item["type"] == "text": + aug_content += item["text"] + elif item["type"] == "image_url": + img_url = item["image_url"] + img_caption = "" + + if self._custom_caption_func: + img_caption = self._custom_caption_func(img_url, get_pil_image(img_url), self._lmm_client) + elif self._lmm_client: + img_data = get_image_data(img_url) + img_caption = self._get_image_caption(img_data) + else: + img_caption = "" + + aug_content += f" in case you can not see, the caption of this image is: {img_caption}\n" + else: + print(f"Warning: the input type should either be `test` or `image_url`. Skip {item['type']} here.") + + return aug_content + + def _get_image_caption(self, img_data: str) -> str: + """Args: + img_data (str): base64 encoded image data. + + Returns: + str: caption for the given image. + """ + response = self._lmm_client.create( + context=None, + messages=[ + { + "role": "user", + "content": [ + {"type": "text", "text": self._description_prompt}, + { + "type": "image_url", + "image_url": convert_base64_to_data_uri(img_data), + }, + ], + } + ], + ) + description = response.choices[0].message.content + return content_str(description) diff --git a/mm_agents/coact/autogen/agentchat/contrib/img_utils.py b/mm_agents/coact/autogen/agentchat/contrib/img_utils.py new file mode 100644 index 0000000..be88a33 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/contrib/img_utils.py @@ -0,0 +1,411 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +import base64 +import copy +import os +import re +from io import BytesIO +from math import ceil +from typing import Any, Union + +import requests + +from ...import_utils import optional_import_block, require_optional_import +from .. 
import utils + +with optional_import_block(): + from PIL import Image + + +# Parameters for token counting for images for different models +MODEL_PARAMS = { + "gpt-4-vision": { + "max_edge": 2048, + "min_edge": 768, + "tile_size": 512, + "base_token_count": 85, + "token_multiplier": 170, + }, + "gpt-4o-mini": { + "max_edge": 2048, + "min_edge": 768, + "tile_size": 512, + "base_token_count": 2833, + "token_multiplier": 5667, + }, + "gpt-4o": {"max_edge": 2048, "min_edge": 768, "tile_size": 512, "base_token_count": 85, "token_multiplier": 170}, +} + + +@require_optional_import("PIL", "unknown") +def get_pil_image(image_file: Union[str, "Image.Image"]) -> "Image.Image": + """Loads an image from a file and returns a PIL Image object. + + Parameters: + image_file (str, or Image): The filename, URL, URI, or base64 string of the image file. + + Returns: + Image.Image: The PIL Image object. + """ + if isinstance(image_file, Image.Image): + # Already a PIL Image object + return image_file + + # Remove quotes if existed + if image_file.startswith('"') and image_file.endswith('"'): + image_file = image_file[1:-1] + if image_file.startswith("'") and image_file.endswith("'"): + image_file = image_file[1:-1] + + if image_file.startswith("http://") or image_file.startswith("https://"): + # A URL file + response = requests.get(image_file) + content = BytesIO(response.content) + image = Image.open(content) + # Match base64-encoded image URIs for supported formats: jpg, jpeg, png, gif, bmp, webp + elif re.match(r"data:image/(?:jpg|jpeg|png|gif|bmp|webp);base64,", image_file): + # A URI. Remove the prefix and decode the base64 string. + base64_data = re.sub(r"data:image/(?:jpg|jpeg|png|gif|bmp|webp);base64,", "", image_file) + image = _to_pil(base64_data) + elif os.path.exists(image_file): + # A local file + image = Image.open(image_file) + else: + # base64 encoded string + image = _to_pil(image_file) + + return image.convert("RGB") + + +@require_optional_import("PIL", "unknown") +def get_image_data(image_file: Union[str, "Image.Image"], use_b64=True) -> bytes: + """Loads an image and returns its data either as raw bytes or in base64-encoded format. + + This function first loads an image from the specified file, URL, or base64 string using + the `get_pil_image` function. It then saves this image in memory in PNG format and + retrieves its binary content. Depending on the `use_b64` flag, this binary content is + either returned directly or as a base64-encoded string. + + Parameters: + image_file (str, or Image): The path to the image file, a URL to an image, or a base64-encoded + string of the image. + use_b64 (bool): If True, the function returns a base64-encoded string of the image data. + If False, it returns the raw byte data of the image. Defaults to True. + + Returns: + bytes: The image data in raw bytes if `use_b64` is False, or a base64-encoded string + if `use_b64` is True. + """ + image = get_pil_image(image_file) + + buffered = BytesIO() + image.save(buffered, format="PNG") + content = buffered.getvalue() + + if use_b64: + return base64.b64encode(content).decode("utf-8") + else: + return content + + +@require_optional_import("PIL", "unknown") +def llava_formatter(prompt: str, order_image_tokens: bool = False) -> tuple[str, list[str]]: + """Formats the input prompt by replacing image tags and returns the new prompt along with image locations. + + Parameters: + - prompt (str): The input string that may contain image tags like ``. 
+    - order_image_tokens (bool, optional): Whether to order the image tokens with numbers.
+        It will be useful for GPT-4V. Defaults to False.
+
+    Returns:
+    - Tuple[str, List[str]]: A tuple containing the formatted string and a list of images (loaded in b64 format).
+    """
+    # Initialize variables
+    new_prompt = prompt
+    image_locations = []
+    images = []
+    image_count = 0
+
+    # Regular expression pattern for matching `<img ...>` tags
+    img_tag_pattern = re.compile(r"<img ([^>]+)>")
+
+    # Find all image tags
+    for match in img_tag_pattern.finditer(prompt):
+        image_location = match.group(1)
+
+        try:
+            img_data = get_image_data(image_location)
+        except Exception as e:
+            # Remove the token
+            print(f"Warning! Unable to load image from {image_location}, because of {e}")
+            new_prompt = new_prompt.replace(match.group(0), "", 1)
+            continue
+
+        image_locations.append(image_location)
+        images.append(img_data)
+
+        # Increment the image count and replace the `<img ...>` tag in the prompt
+        new_token = f"<image {image_count}>" if order_image_tokens else "<image>"
+        new_prompt = new_prompt.replace(match.group(0), new_token, 1)
+        image_count += 1
+
+    return new_prompt, images
+
+
+@require_optional_import("PIL", "unknown")
+def pil_to_data_uri(image: "Image.Image") -> str:
+    """Converts a PIL Image object to a data URI.
+
+    Parameters:
+        image (Image.Image): The PIL Image object.
+
+    Returns:
+        str: The data URI string.
+    """
+    buffered = BytesIO()
+    image.save(buffered, format="PNG")
+    content = buffered.getvalue()
+    return convert_base64_to_data_uri(base64.b64encode(content).decode("utf-8"))
+
+
+def convert_base64_to_data_uri(base64_image):
+    def _get_mime_type_from_data_uri(base64_image):
+        # Decode the base64 string
+        image_data = base64.b64decode(base64_image)
+        # Check the first few bytes for known signatures
+        if image_data.startswith(b"\xff\xd8\xff"):
+            return "image/jpeg"
+        elif image_data.startswith(b"\x89PNG\r\n\x1a\n"):
+            return "image/png"
+        elif image_data.startswith(b"GIF87a") or image_data.startswith(b"GIF89a"):
+            return "image/gif"
+        elif image_data.startswith(b"RIFF") and image_data[8:12] == b"WEBP":
+            return "image/webp"
+        return "image/jpeg"  # use jpeg for unknown formats, best guess.
+
+    mime_type = _get_mime_type_from_data_uri(base64_image)
+    data_uri = f"data:{mime_type};base64,{base64_image}"
+    return data_uri
+
+
+@require_optional_import("PIL", "unknown")
+def gpt4v_formatter(prompt: str, img_format: str = "uri") -> list[Union[str, dict[str, Any]]]:
+    """Formats the input prompt by replacing image tags and returns a list of text and images.
+
+    Args:
+        prompt (str): The input string that may contain image tags like `<img http://example.com/image.png>`.
+        img_format (str): what image format should be used. One of "uri", "url", "pil".
+
+    Returns:
+        List[Union[str, dict[str, Any]]]: A list of alternating text and image dictionary items.
+    """
+    assert img_format in ["uri", "url", "pil"]
+
+    output = []
+    last_index = 0
+    image_count = 0
+
+    # Find all image tags
+    for parsed_tag in utils.parse_tags_from_content("img", prompt):
+        image_location = parsed_tag["attr"]["src"]
+        try:
+            if img_format == "pil":
+                img_data = get_pil_image(image_location)
+            elif img_format == "uri":
+                img_data = get_image_data(image_location)
+                img_data = convert_base64_to_data_uri(img_data)
+            elif img_format == "url":
+                img_data = image_location
+            else:
+                raise ValueError(f"Unknown image format {img_format}")
+        except Exception as e:
+            # Warning and skip this token
+            print(f"Warning! 
Unable to load image from {image_location}, because {e}") + continue + + # Add text before this image tag to output list + output.append({"type": "text", "text": prompt[last_index : parsed_tag["match"].start()]}) + + # Add image data to output list + output.append({"type": "image_url", "image_url": {"url": img_data}}) + + last_index = parsed_tag["match"].end() + image_count += 1 + + # Add remaining text to output list + if last_index < len(prompt): + output.append({"type": "text", "text": prompt[last_index:]}) + return output + + +def extract_img_paths(paragraph: str) -> list: + """Extract image paths (URLs or local paths) from a text paragraph. + + Parameters: + paragraph (str): The input text paragraph. + + Returns: + list: A list of extracted image paths. + """ + # Regular expression to match image URLs and file paths. + # This regex detects URLs and file paths with common image extensions, including support for the webp format. + img_path_pattern = re.compile( + r"\b(?:http[s]?://\S+\.(?:jpg|jpeg|png|gif|bmp|webp)|\S+\.(?:jpg|jpeg|png|gif|bmp|webp))\b", re.IGNORECASE + ) + + # Find all matches in the paragraph + img_paths = re.findall(img_path_pattern, paragraph) + return img_paths + + +@require_optional_import("PIL", "unknown") +def _to_pil(data: str) -> "Image.Image": + """Converts a base64 encoded image data string to a PIL Image object. + + This function first decodes the base64 encoded string to bytes, then creates a BytesIO object from the bytes, + and finally creates and returns a PIL Image object from the BytesIO object. + + Parameters: + data (str): The encoded image data string. + + Returns: + Image.Image: The PIL Image object created from the input data. + """ + return Image.open(BytesIO(base64.b64decode(data))) + + +@require_optional_import("PIL", "unknown") +def message_formatter_pil_to_b64(messages: list[dict[str, Any]]) -> list[dict[str, Any]]: + """Converts the PIL image URLs in the messages to base64 encoded data URIs. + + This function iterates over a list of message dictionaries. For each message, + if it contains a 'content' key with a list of items, it looks for items + with an 'image_url' key. The function then converts the PIL image URL + (pointed to by 'image_url') to a base64 encoded data URI. + + Parameters: + messages (List[Dict]): A list of message dictionaries. Each dictionary + may contain a 'content' key with a list of items, + some of which might be image URLs. + + Returns: + List[Dict]: A new list of message dictionaries with PIL image URLs in the + 'image_url' key converted to base64 encoded data URIs. + + Example Input: + example 1: + ```python + [ + {'content': [{'type': 'text', 'text': 'You are a helpful AI assistant.'}], 'role': 'system'}, + {'content': [ + {'type': 'text', 'text': "What's the breed of this dog here?"}, + {'type': 'image_url', 'image_url': {'url': a PIL.Image.Image}}, + {'type': 'text', 'text': '.'}], + 'role': 'user'} + ] + ``` + + Example Output: + example 1: + ```python + [ + {'content': [{'type': 'text', 'text': 'You are a helpful AI assistant.'}], 'role': 'system'}, + {'content': [ + {'type': 'text', 'text': "What's the breed of this dog here?"}, + {'type': 'image_url', 'image_url': {'url': a B64 Image}}, + {'type': 'text', 'text': '.'}], + 'role': 'user'} + ] + ``` + """ + new_messages = [] + for message in messages: + # deepcopy to avoid modifying the original message. 
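+        # (PIL Image objects stored under 'image_url' are replaced with base64 data URIs below,
+        # so the copy keeps the caller's original message objects intact.)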
+ message = copy.deepcopy(message) + if isinstance(message, dict) and "content" in message: + # First, if the content is a string, parse it into a list of parts. + # This is for tool output that contains images. + if isinstance(message["content"], str): + message["content"] = gpt4v_formatter(message["content"], img_format="pil") + + # Second, if the content is a list, process any image parts. + if isinstance(message["content"], list): + for item in message["content"]: + if ( + isinstance(item, dict) + and "image_url" in item + and isinstance(item["image_url"]["url"], Image.Image) + ): + item["image_url"]["url"] = pil_to_data_uri(item["image_url"]["url"]) + + new_messages.append(message) + + return new_messages + + +@require_optional_import("PIL", "unknown") +def num_tokens_from_gpt_image( + image_data: Union[str, "Image.Image"], model: str = "gpt-4-vision", low_quality: bool = False +) -> int: + """Calculate the number of tokens required to process an image based on its dimensions + after scaling for different GPT models. Supports "gpt-4-vision", "gpt-4o", and "gpt-4o-mini". + This function scales the image so that its longest edge is at most 2048 pixels and its shortest + edge is at most 768 pixels (for "gpt-4-vision"). It then calculates the number of 512x512 tiles + needed to cover the scaled image and computes the total tokens based on the number of these tiles. + + Reference: https://openai.com/api/pricing/ + + Args: + image_data : Union[str, Image.Image]: The image data which can either be a base64 encoded string, a URL, a file path, or a PIL Image object. + model: str: The model being used for image processing. Can be "gpt-4-vision", "gpt-4o", or "gpt-4o-mini". + low_quality: bool: Whether to use low-quality processing. Defaults to False. + + Returns: + int: The total number of tokens required for processing the image. + + Examples: + -------- + >>> from PIL import Image + >>> img = Image.new("RGB", (2500, 2500), color="red") + >>> num_tokens_from_gpt_image(img, model="gpt-4-vision") + 765 + """ + image = get_pil_image(image_data) # PIL Image + width, height = image.size + + # Determine model parameters + if "gpt-4-vision" in model or "gpt-4-turbo" in model or "gpt-4v" in model or "gpt-4-v" in model: + params = MODEL_PARAMS["gpt-4-vision"] + elif "gpt-4o-mini" in model: + params = MODEL_PARAMS["gpt-4o-mini"] + elif "gpt-4o" in model: + params = MODEL_PARAMS["gpt-4o"] + else: + raise ValueError( + f"Model {model} is not supported. Choose 'gpt-4-vision', 'gpt-4-turbo', 'gpt-4v', 'gpt-4-v', 'gpt-4o', or 'gpt-4o-mini'." + ) + + if low_quality: + return params["base_token_count"] + + # 1. Constrain the longest edge + if max(width, height) > params["max_edge"]: + scale_factor = params["max_edge"] / max(width, height) + width, height = int(width * scale_factor), int(height * scale_factor) + + # 2. Further constrain the shortest edge + if min(width, height) > params["min_edge"]: + scale_factor = params["min_edge"] / min(width, height) + width, height = int(width * scale_factor), int(height * scale_factor) + + # 3. 
Count how many tiles are needed to cover the image + tiles_width = ceil(width / params["tile_size"]) + tiles_height = ceil(height / params["tile_size"]) + total_tokens = params["base_token_count"] + params["token_multiplier"] * (tiles_width * tiles_height) + + return total_tokens diff --git a/mm_agents/coact/autogen/agentchat/contrib/multimodal_conversable_agent.py b/mm_agents/coact/autogen/agentchat/contrib/multimodal_conversable_agent.py new file mode 100644 index 0000000..d37fff0 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/contrib/multimodal_conversable_agent.py @@ -0,0 +1,153 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +import copy +from typing import Any, Optional, Union + +from ... import OpenAIWrapper +from ...code_utils import content_str +from .. import Agent, ConversableAgent +from ..contrib.img_utils import ( + gpt4v_formatter, + message_formatter_pil_to_b64, +) + +DEFAULT_LMM_SYS_MSG = """You are a helpful AI assistant.""" +DEFAULT_MODEL = "gpt-4-vision-preview" + + +class MultimodalConversableAgent(ConversableAgent): + DEFAULT_CONFIG = { + "model": DEFAULT_MODEL, + } + + def __init__( + self, + name: str, + system_message: Optional[Union[str, list]] = DEFAULT_LMM_SYS_MSG, + is_termination_msg: str = None, + *args, + **kwargs: Any, + ): + """Args: + name (str): agent name. + system_message (str): system message for the OpenAIWrapper inference. + Please override this attribute if you want to reprogram the agent. + **kwargs (dict): Please refer to other kwargs in + [ConversableAgent](/docs/api-reference/autogen/ConversableAgent#conversableagent). + """ + super().__init__( + name, + system_message, + is_termination_msg=is_termination_msg, + *args, + **kwargs, + ) + # call the setter to handle special format. + self.update_system_message(system_message) + self._is_termination_msg = ( + is_termination_msg + if is_termination_msg is not None + else (lambda x: content_str(x.get("content")) == "TERMINATE") + ) + + # Override the `generate_oai_reply` + self.replace_reply_func(ConversableAgent.generate_oai_reply, MultimodalConversableAgent.generate_oai_reply) + self.replace_reply_func( + ConversableAgent.a_generate_oai_reply, + MultimodalConversableAgent.a_generate_oai_reply, + ) + + def update_system_message(self, system_message: Union[dict[str, Any], list[str], str]): + """Update the system message. + + Args: + system_message (str): system message for the OpenAIWrapper inference. + """ + self._oai_system_message[0]["content"] = self._message_to_dict(system_message)["content"] + self._oai_system_message[0]["role"] = "system" + + @staticmethod + def _message_to_dict(message: Union[dict[str, Any], list[str], str]) -> dict: + """Convert a message to a dictionary. This implementation + handles the GPT-4V formatting for easier prompts. + + The message can be a string, a dictionary, or a list of dictionaries: + - If it's a string, it will be cast into a list and placed in the 'content' field. + - If it's a list, it will be directly placed in the 'content' field. + - If it's a dictionary, it is already in message dict format. The 'content' field of this dictionary + will be processed using the gpt4v_formatter. 
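+
+        For example, a plain string such as "Describe the attached screenshot" becomes
+        {"content": [{"type": "text", "text": "Describe the attached screenshot"}]}, with any
+        inline image tags expanded into image entries by gpt4v_formatter.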
+ """ + if isinstance(message, str): + return {"content": gpt4v_formatter(message, img_format="pil")} + if isinstance(message, list): + return {"content": message} + if isinstance(message, dict): + assert "content" in message, "The message dict must have a `content` field" + if isinstance(message["content"], str): + message = copy.deepcopy(message) + message["content"] = gpt4v_formatter(message["content"], img_format="pil") + try: + content_str(message["content"]) + except (TypeError, ValueError) as e: + print("The `content` field should be compatible with the content_str function!") + raise e + return message + raise ValueError(f"Unsupported message type: {type(message)}") + + def generate_oai_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[OpenAIWrapper] = None, + ) -> tuple[bool, Optional[Union[str, dict[str, Any]]]]: + """Generate a reply using autogen.oai.""" + client = self.client if config is None else config + if client is None: + return False, None + if messages is None: + messages = self._oai_messages[sender] + + messages_with_b64_img = message_formatter_pil_to_b64(self._oai_system_message + messages) + + new_messages = [] + for message in messages_with_b64_img: + if 'tool_responses' in message: + for tool_response in message['tool_responses']: + tmp_image = None + tmp_list = [] + for ctx in message['content']: + if ctx['type'] == 'image_url': + tmp_image = ctx + tmp_list.append({ + 'role': 'tool', + 'tool_call_id': tool_response['tool_call_id'], + 'content': [message['content'][0]] + }) + if tmp_image: + tmp_list.append({ + 'role': 'user', + 'content': [ + {'type': 'text', 'text': 'I take a screenshot for the current state for you.'}, + tmp_image + ] + }) + new_messages.extend(tmp_list) + else: + new_messages.append(message) + messages_with_b64_img = new_messages.copy() + + + # TODO: #1143 handle token limit exceeded error + response = client.create( + context=messages[-1].pop("context", None), messages=messages_with_b64_img, agent=self.name + ) + + # TODO: line 301, line 271 is converting messages to dict. Can be removed after ChatCompletionMessage_to_dict is merged. + extracted_response = client.extract_text_or_completion_object(response)[0] + if not isinstance(extracted_response, str): + extracted_response = extracted_response.model_dump() + return True, extracted_response diff --git a/mm_agents/coact/autogen/agentchat/conversable_agent.py b/mm_agents/coact/autogen/agentchat/conversable_agent.py new file mode 100644 index 0000000..e4ee85f --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/conversable_agent.py @@ -0,0 +1,4023 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. 
+# SPDX-License-Identifier: MIT +import asyncio +import copy +import functools +import inspect +import json +import logging +import re +import threading +import warnings +from collections import defaultdict +from contextlib import contextmanager +from dataclasses import dataclass +from inspect import signature +from typing import ( + TYPE_CHECKING, + Any, + Callable, + Generator, + Iterable, + Literal, + Optional, + TypeVar, + Union, +) + +from ..cache.cache import AbstractCache, Cache +from ..code_utils import ( + PYTHON_VARIANTS, + UNKNOWN, + check_can_use_docker_or_throw, + content_str, + decide_use_docker, + execute_code, + extract_code, + infer_lang, +) +from ..coding.base import CodeExecutor +from ..coding.factory import CodeExecutorFactory +from ..doc_utils import export_module +from ..events.agent_events import ( + ClearConversableAgentHistoryEvent, + ClearConversableAgentHistoryWarningEvent, + ConversableAgentUsageSummaryEvent, + ConversableAgentUsageSummaryNoCostIncurredEvent, + ErrorEvent, + ExecuteCodeBlockEvent, + ExecuteFunctionEvent, + ExecutedFunctionEvent, + GenerateCodeExecutionReplyEvent, + PostCarryoverProcessingEvent, + RunCompletionEvent, + TerminationAndHumanReplyNoInputEvent, + TerminationEvent, + UsingAutoReplyEvent, + create_received_event_model, +) +from ..exception_utils import InvalidCarryOverTypeError, SenderRequiredError +from ..io.base import IOStream +from ..io.run_response import AsyncRunResponse, AsyncRunResponseProtocol, RunResponse, RunResponseProtocol +from ..io.thread_io_stream import AsyncThreadIOStream, ThreadIOStream +from ..llm_config import LLMConfig +from ..oai.client import ModelClient, OpenAIWrapper +from ..runtime_logging import log_event, log_function_use, log_new_agent, logging_enabled +from ..tools import ChatContext, Tool, load_basemodels_if_needed, serialize_to_str +from .agent import Agent, LLMAgent +from .chat import ( + ChatResult, + _post_process_carryover_item, + _validate_recipients, + a_initiate_chats, + initiate_chats, +) +from .group.context_variables import ContextVariables +from .group.handoffs import Handoffs +from .utils import consolidate_chat_info, gather_usage_summary + +if TYPE_CHECKING: + from .group.on_condition import OnCondition + from .group.on_context_condition import OnContextCondition + +__all__ = ("ConversableAgent",) + +logger = logging.getLogger(__name__) + +F = TypeVar("F", bound=Callable[..., Any]) + + +@dataclass +@export_module("autogen") +class UpdateSystemMessage: + """Update the agent's system message before they reply + + Args: + content_updater: The format string or function to update the agent's system message. Can be a format string or a Callable. + If a string, it will be used as a template and substitute the context variables. + If a Callable, it should have the signature: + def my_content_updater(agent: ConversableAgent, messages: List[Dict[str, Any]]) -> str + """ + + content_updater: Union[Callable, str] + + def __post_init__(self): + if isinstance(self.content_updater, str): + # find all {var} in the string + vars = re.findall(r"\{(\w+)\}", self.content_updater) + if len(vars) == 0: + warnings.warn("Update function string contains no variables. 
This is probably unintended.") + + elif isinstance(self.content_updater, Callable): + sig = signature(self.content_updater) + if len(sig.parameters) != 2: + raise ValueError( + "The update function must accept two parameters of type ConversableAgent and List[Dict[str, Any]], respectively" + ) + if sig.return_annotation != str: + raise ValueError("The update function must return a string") + else: + raise ValueError("The update function must be either a string or a callable") + + +@export_module("autogen") +class ConversableAgent(LLMAgent): + """(In preview) A class for generic conversable agents which can be configured as assistant or user proxy. + + After receiving each message, the agent will send a reply to the sender unless the msg is a termination msg. + For example, AssistantAgent and UserProxyAgent are subclasses of this class, + configured with different default settings. + + To modify auto reply, override `generate_reply` method. + To disable/enable human response in every turn, set `human_input_mode` to "NEVER" or "ALWAYS". + To modify the way to get human input, override `get_human_input` method. + To modify the way to execute code blocks, single code block, or function call, override `execute_code_blocks`, + `run_code`, and `execute_function` methods respectively. + """ + + DEFAULT_CONFIG = False # False or dict, the default config for llm inference + MAX_CONSECUTIVE_AUTO_REPLY = 100 # maximum number of consecutive auto replies (subject to future change) + + DEFAULT_SUMMARY_PROMPT = "Summarize the takeaway from the conversation. Do not add any introductory phrases." + DEFAULT_SUMMARY_METHOD = "last_msg" + llm_config: Union[dict[str, Any], Literal[False]] + + def __init__( + self, + name: str, + system_message: Optional[Union[str, list]] = "You are a helpful AI Assistant.", + is_termination_msg: Optional[Callable[[dict[str, Any]], bool]] = None, + max_consecutive_auto_reply: Optional[int] = None, + human_input_mode: Literal["ALWAYS", "NEVER", "TERMINATE"] = "TERMINATE", + function_map: Optional[dict[str, Callable[..., Any]]] = None, + code_execution_config: Union[dict[str, Any], Literal[False]] = False, + llm_config: Optional[Union[LLMConfig, dict[str, Any], Literal[False]]] = None, + default_auto_reply: Union[str, dict[str, Any]] = "", + description: Optional[str] = None, + chat_messages: Optional[dict[Agent, list[dict[str, Any]]]] = None, + silent: Optional[bool] = None, + context_variables: Optional["ContextVariables"] = None, + functions: Union[list[Callable[..., Any]], Callable[..., Any]] = None, + update_agent_state_before_reply: Optional[ + Union[list[Union[Callable, UpdateSystemMessage]], Callable, UpdateSystemMessage] + ] = None, + handoffs: Optional[Handoffs] = None, + ): + """ + Args: + name (str): name of the agent. + system_message (str or list): system message for the ChatCompletion inference. + is_termination_msg (function): a function that takes a message in the form of a dictionary + and returns a boolean value indicating if this received message is a termination message. + The dict can contain the following keys: "content", "role", "name", "function_call". + max_consecutive_auto_reply (int): the maximum number of consecutive auto replies. + default to None (no limit provided, class attribute MAX_CONSECUTIVE_AUTO_REPLY will be used as the limit in this case). + When set to 0, no auto reply will be generated. + human_input_mode (str): whether to ask for human inputs every time a message is received. + Possible values are "ALWAYS", "TERMINATE", "NEVER". 
+                (1) When "ALWAYS", the agent prompts for human input every time a message is received.
+                    Under this mode, the conversation stops when the human input is "exit",
+                    or when is_termination_msg is True and there is no human input.
+                (2) When "TERMINATE", the agent prompts for human input only when a termination message is received or
+                    the number of auto replies reaches the max_consecutive_auto_reply.
+                (3) When "NEVER", the agent will never prompt for human input. Under this mode, the conversation stops
+                    when the number of auto replies reaches the max_consecutive_auto_reply or when is_termination_msg is True.
+            function_map (dict[str, callable]): Mapping function names (passed to openai) to callable functions, also used for tool calls.
+            code_execution_config (dict or False): config for the code execution.
+                To disable code execution, set to False. Otherwise, set to a dictionary with the following keys:
+                - work_dir (Optional, str): The working directory for the code execution.
+                    If None, a default working directory will be used.
+                    The default working directory is the "extensions" directory under
+                    "path_to_autogen".
+                - use_docker (Optional, list, str or bool): The docker image to use for code execution.
+                    Default is True, which means the code will be executed in a docker container. A default list of images will be used.
+                    If a list or a str of image name(s) is provided, the code will be executed in a docker container
+                    with the first image successfully pulled.
+                    If False, the code will be executed in the current environment.
+                    We strongly recommend using docker for code execution.
+                - timeout (Optional, int): The maximum execution time in seconds.
+                - last_n_messages (Experimental, int or str): The number of messages to look back for code execution.
+                    If set to 'auto', it will scan backwards through all messages arriving since the agent last spoke, which is typically the last time execution was attempted. (Default: auto)
+            llm_config (LLMConfig or dict or False or None): llm inference configuration.
+                Please refer to [OpenAIWrapper.create](https://docs.ag2.ai/latest/docs/api-reference/autogen/OpenAIWrapper/#autogen.OpenAIWrapper.create)
+                for available options.
+                When using OpenAI or Azure OpenAI endpoints, please specify a non-empty 'model' either in `llm_config` or in each config of 'config_list' in `llm_config`.
+                To disable llm-based auto reply, set to False.
+                When set to None, will use self.DEFAULT_CONFIG, which defaults to False.
+            default_auto_reply (str or dict): default auto reply when no code execution or llm-based reply is generated.
+            description (str): a short description of the agent. This description is used by other agents
+                (e.g. the GroupChatManager) to decide when to call upon this agent. (Default: system_message)
+            chat_messages (dict or None): the previous chat messages that this agent had in the past with other agents.
+                Can be used to give the agent a memory by providing the chat history. This will allow the agent to
+                resume previously held conversations. Defaults to an empty chat history.
+            silent (bool or None): (Experimental) whether to print the message sent. If None, will use the value of
+                silent in each function.
+            context_variables (ContextVariables or None): Context variables that provide a persistent context for the agent.
+                Note: This will be a reference to a shared context for multi-agent chats.
+                Behaves like a dictionary with keys and values (akin to dict[str, Any]).
+ functions (List[Callable[..., Any]]): A list of functions to register with the agent, these will be wrapped up as tools and registered for LLM (not execution). + update_agent_state_before_reply (List[Callable[..., Any]]): A list of functions, including UpdateSystemMessage's, called to update the agent before it replies. + handoffs (Handoffs): Handoffs object containing all handoff transition conditions. + """ + self.handoffs = handoffs if handoffs is not None else Handoffs() + + # we change code_execution_config below and we have to make sure we don't change the input + # in case of UserProxyAgent, without this we could even change the default value {} + code_execution_config = ( + code_execution_config.copy() if hasattr(code_execution_config, "copy") else code_execution_config + ) + + # a dictionary of conversations, default value is list + if chat_messages is None: + self._oai_messages = defaultdict(list) + else: + self._oai_messages = chat_messages + + self._oai_system_message = [{"content": system_message, "role": "system"}] + self._description = description if description is not None else system_message + self._is_termination_msg = ( + is_termination_msg + if is_termination_msg is not None + else (lambda x: content_str(x.get("content")) == "TERMINATE") + ) + self.silent = silent + self.run_executor: Optional[ConversableAgent] = None + + # Take a copy to avoid modifying the given dict + if isinstance(llm_config, dict): + try: + llm_config = copy.deepcopy(llm_config) + except TypeError as e: + raise TypeError( + "Please implement __deepcopy__ method for each value class in llm_config to support deepcopy." + " Refer to the docs for more details: https://docs.ag2.ai/docs/user-guide/advanced-concepts/llm-configuration-deep-dive/#adding-http-client-in-llm_config-for-proxy" + ) from e + + self.llm_config = self._validate_llm_config(llm_config) + self.client = self._create_client(self.llm_config) + self._validate_name(name) + self._name = name + + if logging_enabled(): + log_new_agent(self, locals()) + + # Initialize standalone client cache object. 
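+        # (Typically populated for the duration of a chat when a cache is passed to initiate_chat,
+        # so LLM responses can be reused across turns; None disables that reuse here.)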
+ self.client_cache = None + + # To track UI tools + self._ui_tools: list[Tool] = [] + + self.human_input_mode = human_input_mode + self._max_consecutive_auto_reply = ( + max_consecutive_auto_reply if max_consecutive_auto_reply is not None else self.MAX_CONSECUTIVE_AUTO_REPLY + ) + self._consecutive_auto_reply_counter = defaultdict(int) + self._max_consecutive_auto_reply_dict = defaultdict(self.max_consecutive_auto_reply) + self._function_map = ( + {} + if function_map is None + else {name: callable for name, callable in function_map.items() if self._assert_valid_name(name)} + ) + self._default_auto_reply = default_auto_reply + self._reply_func_list = [] + self._human_input = [] + self.reply_at_receive = defaultdict(bool) + self.register_reply([Agent, None], ConversableAgent.generate_oai_reply) + self.register_reply([Agent, None], ConversableAgent.a_generate_oai_reply, ignore_async_in_sync_chat=True) + + self.context_variables = context_variables if context_variables is not None else ContextVariables() + + self._tools: list[Tool] = [] + + # Register functions to the agent + if isinstance(functions, list): + if not all(isinstance(func, Callable) for func in functions): + raise TypeError("All elements in the functions list must be callable") + self._add_functions(functions) + elif isinstance(functions, Callable): + self._add_single_function(functions) + elif functions is not None: + raise TypeError("Functions must be a callable or a list of callables") + + # Setting up code execution. + # Do not register code execution reply if code execution is disabled. + if code_execution_config is not False: + # If code_execution_config is None, set it to an empty dict. + if code_execution_config is None: + warnings.warn( + "Using None to signal a default code_execution_config is deprecated. " + "Use {} to use default or False to disable code execution.", + stacklevel=2, + ) + code_execution_config = {} + if not isinstance(code_execution_config, dict): + raise ValueError("code_execution_config must be a dict or False.") + + # We have got a valid code_execution_config. + self._code_execution_config: Union[dict[str, Any], Literal[False]] = code_execution_config + + if self._code_execution_config.get("executor") is not None: + if "use_docker" in self._code_execution_config: + raise ValueError( + "'use_docker' in code_execution_config is not valid when 'executor' is set. Use the appropriate arg in the chosen executor instead." + ) + + if "work_dir" in self._code_execution_config: + raise ValueError( + "'work_dir' in code_execution_config is not valid when 'executor' is set. Use the appropriate arg in the chosen executor instead." + ) + + if "timeout" in self._code_execution_config: + raise ValueError( + "'timeout' in code_execution_config is not valid when 'executor' is set. Use the appropriate arg in the chosen executor instead." + ) + + # Use the new code executor. + self._code_executor = CodeExecutorFactory.create(self._code_execution_config) + self.register_reply([Agent, None], ConversableAgent._generate_code_execution_reply_using_executor) + else: + # Legacy code execution using code_utils. + use_docker = self._code_execution_config.get("use_docker", None) + use_docker = decide_use_docker(use_docker) + check_can_use_docker_or_throw(use_docker) + self._code_execution_config["use_docker"] = use_docker + self.register_reply([Agent, None], ConversableAgent.generate_code_execution_reply) + else: + # Code execution is disabled. 
+ self._code_execution_config = False + + self.register_reply([Agent, None], ConversableAgent.generate_tool_calls_reply) + self.register_reply([Agent, None], ConversableAgent.a_generate_tool_calls_reply, ignore_async_in_sync_chat=True) + self.register_reply([Agent, None], ConversableAgent.generate_function_call_reply) + self.register_reply( + [Agent, None], ConversableAgent.a_generate_function_call_reply, ignore_async_in_sync_chat=True + ) + self.register_reply([Agent, None], ConversableAgent.check_termination_and_human_reply) + self.register_reply( + [Agent, None], ConversableAgent.a_check_termination_and_human_reply, ignore_async_in_sync_chat=True + ) + + # Registered hooks are kept in lists, indexed by hookable method, to be called in their order of registration. + # New hookable methods should be added to this list as required to support new agent capabilities. + self.hook_lists: dict[str, list[Callable[..., Any]]] = { + "process_last_received_message": [], + "process_all_messages_before_reply": [], + "process_message_before_send": [], + "update_agent_state": [], + } + + # Associate agent update state hooks + self._register_update_agent_state_before_reply(update_agent_state_before_reply) + + def _validate_name(self, name: str) -> None: + if not self.llm_config: + return + + if any([ + entry for entry in self.llm_config.config_list if entry.api_type == "openai" and re.search(r"\s", name) + ]): + raise ValueError(f"The name of the agent cannot contain any whitespace. The name provided is: '{name}'") + + def _get_display_name(self): + """Get the string representation of the agent. + + If you would like to change the standard string representation for an + instance of ConversableAgent, you can point it to another function. + In this example a function called _group_agent_str that returns a string: + agent._get_display_name = MethodType(_group_agent_str, agent) + """ + return self.name + + def __str__(self): + return self._get_display_name() + + def _add_functions(self, func_list: list[Callable[..., Any]]): + """Add (Register) a list of functions to the agent + + Args: + func_list (list[Callable[..., Any]]): A list of functions to register with the agent.""" + for func in func_list: + self._add_single_function(func) + + def _add_single_function(self, func: Callable, name: Optional[str] = None, description: Optional[str] = ""): + """Add a single function to the agent + + Args: + func (Callable): The function to register. + name (str): The name of the function. If not provided, the function's name will be used. + description (str): The description of the function, used by the LLM. If not provided, the function's docstring will be used. + """ + if name: + func._name = name + elif not hasattr(func, "_name"): + func._name = func.__name__ + + if hasattr(func, "_description") and func._description and not description: + # If the function already has a description, use it + description = func._description + else: + if description: + func._description = description + else: + # Use function's docstring, strip whitespace, fall back to empty string + description = (func.__doc__ or "").strip() + func._description = description + + # Register the function + self.register_for_llm(name=name, description=description, silent_override=True)(func) + + def _register_update_agent_state_before_reply( + self, functions: Optional[Union[list[Callable[..., Any]], Callable[..., Any]]] + ): + """ + Register functions that will be called when the agent is selected and before it speaks. 
+ You can add your own validation or precondition functions here. + + Args: + functions (List[Callable[[], None]]): A list of functions to be registered. Each function + is called when the agent is selected and before it speaks. + """ + if functions is None: + return + if not isinstance(functions, list) and type(functions) not in [UpdateSystemMessage, Callable[..., Any]]: + raise ValueError("functions must be a list of callables") + + if not isinstance(functions, list): + functions = [functions] + + for func in functions: + if isinstance(func, UpdateSystemMessage): + # Wrapper function that allows this to be used in the update_agent_state hook + # Its primary purpose, however, is just to update the agent's system message + # Outer function to create a closure with the update function + def create_wrapper(update_func: UpdateSystemMessage): + def update_system_message_wrapper( + agent: ConversableAgent, messages: list[dict[str, Any]] + ) -> list[dict[str, Any]]: + if isinstance(update_func.content_updater, str): + # Templates like "My context variable passport is {passport}" will + # use the context_variables for substitution + sys_message = OpenAIWrapper.instantiate( + template=update_func.content_updater, + context=agent.context_variables.to_dict(), + allow_format_str_template=True, + ) + else: + sys_message = update_func.content_updater(agent, messages) + + agent.update_system_message(sys_message) + return messages + + return update_system_message_wrapper + + self.register_hook(hookable_method="update_agent_state", hook=create_wrapper(func)) + + else: + self.register_hook(hookable_method="update_agent_state", hook=func) + + @classmethod + def _validate_llm_config( + cls, llm_config: Optional[Union[LLMConfig, dict[str, Any], Literal[False]]] + ) -> Union[LLMConfig, Literal[False]]: + # if not(llm_config in (None, False) or isinstance(llm_config, [dict, LLMConfig])): + # raise ValueError( + # "llm_config must be a dict or False or None." + # ) + + if llm_config is None: + llm_config = LLMConfig.get_current_llm_config() + if llm_config is None: + llm_config = cls.DEFAULT_CONFIG + elif isinstance(llm_config, dict): + llm_config = LLMConfig(**llm_config) + elif isinstance(llm_config, LLMConfig): + llm_config = llm_config.copy() + elif llm_config is False: + pass + else: + raise ValueError("llm_config must be a LLMConfig, dict or False or None.") + + return llm_config + + @classmethod + def _create_client(cls, llm_config: Union[LLMConfig, Literal[False]]) -> Optional[OpenAIWrapper]: + return None if llm_config is False else OpenAIWrapper(**llm_config) + + @staticmethod + def _is_silent(agent: Agent, silent: Optional[bool] = False) -> bool: + return agent.silent if agent.silent is not None else silent + + @property + def name(self) -> str: + """Get the name of the agent.""" + return self._name + + @property + def description(self) -> str: + """Get the description of the agent.""" + return self._description + + @description.setter + def description(self, description: str): + """Set the description of the agent.""" + self._description = description + + @property + def code_executor(self) -> Optional[CodeExecutor]: + """The code executor used by this agent. 
Returns None if code execution is disabled.""" + if not hasattr(self, "_code_executor"): + return None + return self._code_executor + + def register_reply( + self, + trigger: Union[type[Agent], str, Agent, Callable[[Agent], bool], list], + reply_func: Callable, + position: int = 0, + config: Optional[Any] = None, + reset_config: Optional[Callable[..., Any]] = None, + *, + ignore_async_in_sync_chat: bool = False, + remove_other_reply_funcs: bool = False, + ): + """Register a reply function. + + The reply function will be called when the trigger matches the sender. + The function registered later will be checked earlier by default. + To change the order, set the position to a positive integer. + + Both sync and async reply functions can be registered. The sync reply function will be triggered + from both sync and async chats. However, an async reply function will only be triggered from async + chats (initiated with `ConversableAgent.a_initiate_chat`). If an `async` reply function is registered + and a chat is initialized with a sync function, `ignore_async_in_sync_chat` determines the behaviour as follows: + if `ignore_async_in_sync_chat` is set to `False` (default value), an exception will be raised, and + if `ignore_async_in_sync_chat` is set to `True`, the reply function will be ignored. + + Args: + trigger (Agent class, str, Agent instance, callable, or list): the trigger. + If a class is provided, the reply function will be called when the sender is an instance of the class. + If a string is provided, the reply function will be called when the sender's name matches the string. + If an agent instance is provided, the reply function will be called when the sender is the agent instance. + If a callable is provided, the reply function will be called when the callable returns True. + If a list is provided, the reply function will be called when any of the triggers in the list is activated. + If None is provided, the reply function will be called only when the sender is None. + Note: Be sure to register `None` as a trigger if you would like to trigger an auto-reply function with non-empty messages and `sender=None`. + reply_func (Callable): the reply function. + The function takes a recipient agent, a list of messages, a sender agent and a config as input and returns a reply message. + + ```python + def reply_func( + recipient: ConversableAgent, + messages: Optional[List[Dict]] = None, + sender: Optional[Agent] = None, + config: Optional[Any] = None, + ) -> Tuple[bool, Union[str, Dict, None]]: + ``` + position (int): the position of the reply function in the reply function list. + The function registered later will be checked earlier by default. + To change the order, set the position to a positive integer. + config (Any): the config to be passed to the reply function. + When an agent is reset, the config will be reset to the original value. + reset_config (Callable): the function to reset the config. + The function returns None. Signature: ```def reset_config(config: Any)``` + ignore_async_in_sync_chat (bool): whether to ignore the async reply function in sync chats. If `False`, an exception + will be raised if an async reply function is registered and a chat is initialized with a sync + function. + remove_other_reply_funcs (bool): whether to remove other reply functions when registering this reply function. 
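+
+        A minimal usage sketch (the `count_messages` reply function and the `agent` instance below are
+        illustrative and not part of this module; `Agent` is the autogen agent base class):
+
+        ```python
+        def count_messages(recipient, messages=None, sender=None, config=None):
+            # Returning (False, None) marks the reply as non-final, so later registered reply functions still run.
+            print(f"{recipient.name} now holds {len(messages or [])} messages in this conversation")
+            return False, None
+
+        # position=0 places the function at the front of the current reply-function list.
+        agent.register_reply([Agent, None], count_messages, position=0)
+        ```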
+ """ + if not isinstance(trigger, (type, str, Agent, Callable, list)): + raise ValueError("trigger must be a class, a string, an agent, a callable or a list.") + if remove_other_reply_funcs: + self._reply_func_list.clear() + self._reply_func_list.insert( + position, + { + "trigger": trigger, + "reply_func": reply_func, + "config": copy.copy(config), + "init_config": config, + "reset_config": reset_config, + "ignore_async_in_sync_chat": ignore_async_in_sync_chat and inspect.iscoroutinefunction(reply_func), + }, + ) + + def replace_reply_func(self, old_reply_func: Callable, new_reply_func: Callable): + """Replace a registered reply function with a new one. + + Args: + old_reply_func (Callable): the old reply function to be replaced. + new_reply_func (Callable): the new reply function to replace the old one. + """ + for f in self._reply_func_list: + if f["reply_func"] == old_reply_func: + f["reply_func"] = new_reply_func + + @staticmethod + def _get_chats_to_run( + chat_queue: list[dict[str, Any]], + recipient: Agent, + messages: Optional[list[dict[str, Any]]], + sender: Agent, + config: Any, + ) -> list[dict[str, Any]]: + """A simple chat reply function. + This function initiate one or a sequence of chats between the "recipient" and the agents in the + chat_queue. + + It extracts and returns a summary from the nested chat based on the "summary_method" in each chat in chat_queue. + + Returns: + Tuple[bool, str]: A tuple where the first element indicates the completion of the chat, and the second element contains the summary of the last chat if any chats were initiated. + """ + last_msg = messages[-1].get("content") + chat_to_run = [] + for i, c in enumerate(chat_queue): + current_c = c.copy() + if current_c.get("sender") is None: + current_c["sender"] = recipient + message = current_c.get("message") + # If message is not provided in chat_queue, we by default use the last message from the original chat history as the first message in this nested chat (for the first chat in the chat queue). + # NOTE: This setting is prone to change. + if message is None and i == 0: + message = last_msg + if callable(message): + message = message(recipient, messages, sender, config) + # We only run chat that has a valid message. NOTE: This is prone to change depending on applications. 
+ if message: + current_c["message"] = message + chat_to_run.append(current_c) + return chat_to_run + + @staticmethod + def _process_nested_chat_carryover( + chat: dict[str, Any], + recipient: Agent, + messages: list[dict[str, Any]], + sender: Agent, + config: Any, + trim_n_messages: int = 0, + ) -> None: + """Process carryover messages for a nested chat (typically for the first chat of a group chat) + + The carryover_config key is a dictionary containing: + "summary_method": The method to use to summarise the messages, can be "all", "last_msg", "reflection_with_llm" or a Callable + "summary_args": Optional arguments for the summary method + + Supported carryover 'summary_methods' are: + "all" - all messages will be incorporated + "last_msg" - the last message will be incorporated + "reflection_with_llm" - an llm will summarise all the messages and the summary will be incorporated as a single message + Callable - a callable with the signature: my_method(agent: ConversableAgent, messages: List[Dict[str, Any]]) -> str + + Args: + chat: The chat dictionary containing the carryover configuration + recipient: The recipient agent + messages: The messages from the parent chat + sender: The sender agent + config: The LLM configuration + trim_n_messages: The number of latest messages to trim from the messages list + """ + + def concat_carryover(chat_message: str, carryover_message: Union[str, list[dict[str, Any]]]) -> str: + """Concatenate the carryover message to the chat message.""" + prefix = f"{chat_message}\n" if chat_message else "" + + if isinstance(carryover_message, str): + content = carryover_message + elif isinstance(carryover_message, list): + content = "\n".join( + msg["content"] for msg in carryover_message if "content" in msg and msg["content"] is not None + ) + else: + raise ValueError("Carryover message must be a string or a list of dictionaries") + + return f"{prefix}Context:\n{content}" + + carryover_config = chat["carryover_config"] + + if "summary_method" not in carryover_config: + raise ValueError("Carryover configuration must contain a 'summary_method' key") + + carryover_summary_method = carryover_config["summary_method"] + carryover_summary_args = carryover_config.get("summary_args") or {} + + chat_message = "" + message = chat.get("message") + + # If the message is a callable, run it and get the result + if message: + chat_message = message(recipient, messages, sender, config) if callable(message) else message + + # deep copy and trim the latest messages + content_messages = copy.deepcopy(messages) + content_messages = content_messages[:-trim_n_messages] + + if carryover_summary_method == "all": + # Put a string concatenated value of all parent messages into the first message + # (e.g. message = \nContext: \n\n\n...) + carry_over_message = concat_carryover(chat_message, content_messages) + + elif carryover_summary_method == "last_msg": + # (e.g. message = \nContext: \n) + carry_over_message = concat_carryover(chat_message, content_messages[-1]["content"]) + + elif carryover_summary_method == "reflection_with_llm": + # (e.g. 
message = \nContext: \n) + + # Add the messages to the nested chat agent for reflection (we'll clear after reflection) + chat["recipient"]._oai_messages[sender] = content_messages + + carry_over_message_llm = ConversableAgent._reflection_with_llm_as_summary( + sender=sender, + recipient=chat["recipient"], # Chat recipient LLM config will be used for the reflection + summary_args=carryover_summary_args, + ) + + recipient._oai_messages[sender] = [] + + carry_over_message = concat_carryover(chat_message, carry_over_message_llm) + + elif isinstance(carryover_summary_method, Callable): + # (e.g. message = \nContext: \n) + carry_over_message_result = carryover_summary_method(recipient, content_messages, carryover_summary_args) + + carry_over_message = concat_carryover(chat_message, carry_over_message_result) + + chat["message"] = carry_over_message + + @staticmethod + def _process_chat_queue_carryover( + chat_queue: list[dict[str, Any]], + recipient: Agent, + messages: Union[str, Callable[..., Any]], + sender: Agent, + config: Any, + trim_messages: int = 2, + ) -> tuple[bool, Optional[str]]: + """Process carryover configuration for the first chat in the queue. + + Args: + chat_queue: List of chat configurations + recipient: Receiving agent + messages: Chat messages + sender: Sending agent + config: LLM configuration + trim_messages: Number of messages to trim for nested chat carryover (default 2 for nested chat in group chats) + + Returns: + Tuple containing: + - restore_flag: Whether the original message needs to be restored + - original_message: The original message to restore (if any) + """ + restore_chat_queue_message = False + original_chat_queue_message = None + + # Carryover configuration allowed on the first chat in the queue only, trim the last two messages specifically for group chat nested chat carryover as these are the messages for the transition to the nested chat agent + if len(chat_queue) > 0 and "carryover_config" in chat_queue[0]: + if "message" in chat_queue[0]: + # As we're updating the message in the nested chat queue, we need to restore it after finishing this nested chat. + restore_chat_queue_message = True + original_chat_queue_message = chat_queue[0]["message"] + + # TODO Check the trimming required if not a group chat, it may not be 2 because other chats don't have the group transition messages. We may need to add as a carryover_config parameter. + ConversableAgent._process_nested_chat_carryover( + chat=chat_queue[0], + recipient=recipient, + messages=messages, + sender=sender, + config=config, + trim_n_messages=trim_messages, + ) + + return restore_chat_queue_message, original_chat_queue_message + + @staticmethod + def _summary_from_nested_chats( + chat_queue: list[dict[str, Any]], + recipient: Agent, + messages: Optional[list[dict[str, Any]]], + sender: Agent, + config: Any, + ) -> tuple[bool, Union[str, None]]: + """A simple chat reply function. + This function initiate one or a sequence of chats between the "recipient" and the agents in the + chat_queue. + + It extracts and returns a summary from the nested chat based on the "summary_method" in each chat in chat_queue. + + The first chat in the queue can contain a 'carryover_config' which is a dictionary that denotes how to carryover messages from the parent chat into the first chat of the nested chats). Only applies to the first chat. 
+ e.g.: carryover_summarize_chat_config = {"summary_method": "reflection_with_llm", "summary_args": None} + summary_method can be "last_msg", "all", "reflection_with_llm", Callable + The Callable signature: my_method(agent: ConversableAgent, messages: List[Dict[str, Any]]) -> str + The summary will be concatenated to the message of the first chat in the queue. + + Returns: + Tuple[bool, str]: A tuple where the first element indicates the completion of the chat, and the second element contains the summary of the last chat if any chats were initiated. + """ + # Process carryover configuration + restore_chat_queue_message, original_chat_queue_message = ConversableAgent._process_chat_queue_carryover( + chat_queue, recipient, messages, sender, config + ) + + chat_to_run = ConversableAgent._get_chats_to_run(chat_queue, recipient, messages, sender, config) + if not chat_to_run: + return True, None + res = initiate_chats(chat_to_run) + + # We need to restore the chat queue message if it has been modified so that it will be the original message for subsequent uses + if restore_chat_queue_message: + chat_queue[0]["message"] = original_chat_queue_message + + return True, res[-1].summary + + @staticmethod + async def _a_summary_from_nested_chats( + chat_queue: list[dict[str, Any]], + recipient: Agent, + messages: Optional[list[dict[str, Any]]], + sender: Agent, + config: Any, + ) -> tuple[bool, Union[str, None]]: + """A simple chat reply function. + This function initiate one or a sequence of chats between the "recipient" and the agents in the + chat_queue. + + It extracts and returns a summary from the nested chat based on the "summary_method" in each chat in chat_queue. + + The first chat in the queue can contain a 'carryover_config' which is a dictionary that denotes how to carryover messages from the parent chat into the first chat of the nested chats). Only applies to the first chat. + e.g.: carryover_summarize_chat_config = {"summary_method": "reflection_with_llm", "summary_args": None} + summary_method can be "last_msg", "all", "reflection_with_llm", Callable + The Callable signature: my_method(agent: ConversableAgent, messages: List[Dict[str, Any]]) -> str + The summary will be concatenated to the message of the first chat in the queue. + + Returns: + Tuple[bool, str]: A tuple where the first element indicates the completion of the chat, and the second element contains the summary of the last chat if any chats were initiated. 
+ """ + # Process carryover configuration + restore_chat_queue_message, original_chat_queue_message = ConversableAgent._process_chat_queue_carryover( + chat_queue, recipient, messages, sender, config + ) + + chat_to_run = ConversableAgent._get_chats_to_run(chat_queue, recipient, messages, sender, config) + if not chat_to_run: + return True, None + res = await a_initiate_chats(chat_to_run) + index_of_last_chat = chat_to_run[-1]["chat_id"] + + # We need to restore the chat queue message if it has been modified so that it will be the original message for subsequent uses + if restore_chat_queue_message: + chat_queue[0]["message"] = original_chat_queue_message + + return True, res[index_of_last_chat].summary + + def register_nested_chats( + self, + chat_queue: list[dict[str, Any]], + trigger: Union[type[Agent], str, Agent, Callable[[Agent], bool], list], + reply_func_from_nested_chats: Union[str, Callable[..., Any]] = "summary_from_nested_chats", + position: int = 2, + use_async: Union[bool, None] = None, + **kwargs: Any, + ) -> None: + """Register a nested chat reply function. + + Args: + chat_queue (list): a list of chat objects to be initiated. If use_async is used, then all messages in chat_queue must have a chat-id associated with them. + trigger (Agent class, str, Agent instance, callable, or list): refer to `register_reply` for details. + reply_func_from_nested_chats (Callable, str): the reply function for the nested chat. + The function takes a chat_queue for nested chat, recipient agent, a list of messages, a sender agent and a config as input and returns a reply message. + Default to "summary_from_nested_chats", which corresponds to a built-in reply function that get summary from the nested chat_queue. + ```python + def reply_func_from_nested_chats( + chat_queue: List[Dict], + recipient: ConversableAgent, + messages: Optional[List[Dict]] = None, + sender: Optional[Agent] = None, + config: Optional[Any] = None, + ) -> Tuple[bool, Union[str, Dict, None]]: + ``` + position (int): Ref to `register_reply` for details. Default to 2. It means we first check the termination and human reply, then check the registered nested chat reply. + use_async: Uses a_initiate_chats internally to start nested chats. If the original chat is initiated with a_initiate_chats, you may set this to true so nested chats do not run in sync. + kwargs: Ref to `register_reply` for details. 
+ """ + if use_async: + for chat in chat_queue: + if chat.get("chat_id") is None: + raise ValueError("chat_id is required for async nested chats") + + if use_async: + if reply_func_from_nested_chats == "summary_from_nested_chats": + reply_func_from_nested_chats = self._a_summary_from_nested_chats + if not callable(reply_func_from_nested_chats) or not inspect.iscoroutinefunction( + reply_func_from_nested_chats + ): + raise ValueError("reply_func_from_nested_chats must be a callable and a coroutine") + + async def wrapped_reply_func(recipient, messages=None, sender=None, config=None): + return await reply_func_from_nested_chats(chat_queue, recipient, messages, sender, config) + + else: + if reply_func_from_nested_chats == "summary_from_nested_chats": + reply_func_from_nested_chats = self._summary_from_nested_chats + if not callable(reply_func_from_nested_chats): + raise ValueError("reply_func_from_nested_chats must be a callable") + + def wrapped_reply_func(recipient, messages=None, sender=None, config=None): + return reply_func_from_nested_chats(chat_queue, recipient, messages, sender, config) + + functools.update_wrapper(wrapped_reply_func, reply_func_from_nested_chats) + + self.register_reply( + trigger, + wrapped_reply_func, + position, + kwargs.get("config"), + kwargs.get("reset_config"), + ignore_async_in_sync_chat=( + not use_async if use_async is not None else kwargs.get("ignore_async_in_sync_chat") + ), + ) + + @property + def system_message(self) -> str: + """Return the system message.""" + return self._oai_system_message[0]["content"] + + def update_system_message(self, system_message: str) -> None: + """Update the system message. + + Args: + system_message (str): system message for the ChatCompletion inference. + """ + self._oai_system_message[0]["content"] = system_message + + def update_max_consecutive_auto_reply(self, value: int, sender: Optional[Agent] = None): + """Update the maximum number of consecutive auto replies. + + Args: + value (int): the maximum number of consecutive auto replies. + sender (Agent): when the sender is provided, only update the max_consecutive_auto_reply for that sender. + """ + if sender is None: + self._max_consecutive_auto_reply = value + for k in self._max_consecutive_auto_reply_dict: + self._max_consecutive_auto_reply_dict[k] = value + else: + self._max_consecutive_auto_reply_dict[sender] = value + + def max_consecutive_auto_reply(self, sender: Optional[Agent] = None) -> int: + """The maximum number of consecutive auto replies.""" + return self._max_consecutive_auto_reply if sender is None else self._max_consecutive_auto_reply_dict[sender] + + @property + def chat_messages(self) -> dict[Agent, list[dict[str, Any]]]: + """A dictionary of conversations from agent to list of messages.""" + return self._oai_messages + + def chat_messages_for_summary(self, agent: Agent) -> list[dict[str, Any]]: + """A list of messages as a conversation to summarize.""" + return self._oai_messages[agent] + + def last_message(self, agent: Optional[Agent] = None) -> Optional[dict[str, Any]]: + """The last message exchanged with the agent. + + Args: + agent (Agent): The agent in the conversation. + If None and more than one agent's conversations are found, an error will be raised. + If None and only one conversation is found, the last message of the only conversation will be returned. + + Returns: + The last message exchanged with the agent. 
+ """ + if agent is None: + n_conversations = len(self._oai_messages) + if n_conversations == 0: + return None + if n_conversations == 1: + for conversation in self._oai_messages.values(): + return conversation[-1] + raise ValueError("More than one conversation is found. Please specify the sender to get the last message.") + if agent not in self._oai_messages: + raise KeyError( + f"The agent '{agent.name}' is not present in any conversation. No history available for this agent." + ) + return self._oai_messages[agent][-1] + + @property + def use_docker(self) -> Union[bool, str, None]: + """Bool value of whether to use docker to execute the code, + or str value of the docker image name to use, or None when code execution is disabled. + """ + return None if self._code_execution_config is False else self._code_execution_config.get("use_docker") + + @staticmethod + def _message_to_dict(message: Union[dict[str, Any], str]) -> dict: + """Convert a message to a dictionary. + + The message can be a string or a dictionary. The string will be put in the "content" field of the new dictionary. + """ + if isinstance(message, str): + return {"content": message} + elif isinstance(message, dict): + return message + else: + return dict(message) + + @staticmethod + def _normalize_name(name): + """LLMs sometimes ask functions while ignoring their own format requirements, this function should be used to replace invalid characters with "_". + + Prefer _assert_valid_name for validating user configuration or input + """ + return re.sub(r"[^a-zA-Z0-9_-]", "_", name)[:64] + + @staticmethod + def _assert_valid_name(name): + """Ensure that configured names are valid, raises ValueError if not. + + For munging LLM responses use _normalize_name to ensure LLM specified names don't break the API. + """ + if not re.match(r"^[a-zA-Z0-9_-]+$", name): + raise ValueError(f"Invalid name: {name}. Only letters, numbers, '_' and '-' are allowed.") + if len(name) > 64: + raise ValueError(f"Invalid name: {name}. Name must be less than 64 characters.") + return name + + def _append_oai_message( + self, message: Union[dict[str, Any], str], role, conversation_id: Agent, is_sending: bool + ) -> bool: + """Append a message to the ChatCompletion conversation. + + If the message received is a string, it will be put in the "content" field of the new dictionary. + If the message received is a dictionary but does not have any of the three fields "content", "function_call", or "tool_calls", + this message is not a valid ChatCompletion message. + If only "function_call" or "tool_calls" is provided, "content" will be set to None if not provided, and the role of the message will be forced "assistant". + + Args: + message (dict or str): message to be appended to the ChatCompletion conversation. + role (str): role of the message, can be "assistant" or "function". + conversation_id (Agent): id of the conversation, should be the recipient or sender. + is_sending (bool): If the agent (aka self) is sending to the conversation_id agent, otherwise receiving. + + Returns: + bool: whether the message is appended to the ChatCompletion conversation. + """ + message = self._message_to_dict(message) + # create oai message to be appended to the oai conversation that can be passed to oai directly. 
+ oai_message = { + k: message[k] + for k in ("content", "function_call", "tool_calls", "tool_responses", "tool_call_id", "name", "context") + if k in message and message[k] is not None + } + if "content" not in oai_message: + if "function_call" in oai_message or "tool_calls" in oai_message: + oai_message["content"] = None # if only function_call is provided, content will be set to None. + else: + return False + + if message.get("role") in ["function", "tool"]: + oai_message["role"] = message.get("role") + if "tool_responses" in oai_message: + for tool_response in oai_message["tool_responses"]: + tool_response["content"] = str(tool_response["content"]) + elif "override_role" in message: + # If we have a direction to override the role then set the + # role accordingly. Used to customise the role for the + # select speaker prompt. + oai_message["role"] = message.get("override_role") + else: + oai_message["role"] = role + + if oai_message.get("function_call", False) or oai_message.get("tool_calls", False): + oai_message["role"] = "assistant" # only messages with role 'assistant' can have a function call. + elif "name" not in oai_message: + # If we don't have a name field, append it + if is_sending: + oai_message["name"] = self.name + else: + oai_message["name"] = conversation_id.name + + self._oai_messages[conversation_id].append(oai_message) + + return True + + def _process_message_before_send( + self, message: Union[dict[str, Any], str], recipient: Agent, silent: bool + ) -> Union[dict[str, Any], str]: + """Process the message before sending it to the recipient.""" + hook_list = self.hook_lists["process_message_before_send"] + for hook in hook_list: + message = hook( + sender=self, message=message, recipient=recipient, silent=ConversableAgent._is_silent(self, silent) + ) + return message + + def send( + self, + message: Union[dict[str, Any], str], + recipient: Agent, + request_reply: Optional[bool] = None, + silent: Optional[bool] = False, + ): + """Send a message to another agent. + + Args: + message (dict or str): message to be sent. + The message could contain the following fields: + - content (str or List): Required, the content of the message. (Can be None) + - function_call (str): the name of the function to be called. + - name (str): the name of the function to be called. + - role (str): the role of the message, any role that is not "function" + will be modified to "assistant". + - context (dict): the context of the message, which will be passed to + [OpenAIWrapper.create](https://docs.ag2.ai/latest/docs/api-reference/autogen/OpenAIWrapper/#autogen.OpenAIWrapper.create). + For example, one agent can send a message A as: + ```python + { + "content": lambda context: context["use_tool_msg"], + "context": {"use_tool_msg": "Use tool X if they are relevant."}, + } + ``` + Next time, one agent can send a message B with a different "use_tool_msg". + Then the content of message A will be refreshed to the new "use_tool_msg". + So effectively, this provides a way for an agent to send a "link" and modify + the content of the "link" later. + recipient (Agent): the recipient of the message. + request_reply (bool or None): whether to request a reply from the recipient. + silent (bool or None): (Experimental) whether to print the message sent. + + Raises: + ValueError: if the message can't be converted into a valid ChatCompletion message. 
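+
+        A minimal sketch of sending a plain-text message (assuming `planner` and `coder` are
+        ConversableAgent instances created elsewhere):
+
+        ```python
+        # Appends the message to the shared history and asks `coder` for a reply.
+        planner.send("Please draft a unit test for the new parser.", coder, request_reply=True)
+        ```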
+ """ + message = self._process_message_before_send(message, recipient, ConversableAgent._is_silent(self, silent)) + # When the agent composes and sends the message, the role of the message is "assistant" + # unless it's "function". + valid = self._append_oai_message(message, "assistant", recipient, is_sending=True) + if valid: + recipient.receive(message, self, request_reply, silent) + else: + raise ValueError( + "Message can't be converted into a valid ChatCompletion message. Either content or function_call must be provided." + ) + + async def a_send( + self, + message: Union[dict[str, Any], str], + recipient: Agent, + request_reply: Optional[bool] = None, + silent: Optional[bool] = False, + ): + """(async) Send a message to another agent. + + Args: + message (dict or str): message to be sent. + The message could contain the following fields: + - content (str or List): Required, the content of the message. (Can be None) + - function_call (str): the name of the function to be called. + - name (str): the name of the function to be called. + - role (str): the role of the message, any role that is not "function" + will be modified to "assistant". + - context (dict): the context of the message, which will be passed to + [OpenAIWrapper.create](https://docs.ag2.ai/latest/docs/api-reference/autogen/OpenAIWrapper/#autogen.OpenAIWrapper.create). + For example, one agent can send a message A as: + ```python + { + "content": lambda context: context["use_tool_msg"], + "context": {"use_tool_msg": "Use tool X if they are relevant."}, + } + ``` + Next time, one agent can send a message B with a different "use_tool_msg". + Then the content of message A will be refreshed to the new "use_tool_msg". + So effectively, this provides a way for an agent to send a "link" and modify + the content of the "link" later. + recipient (Agent): the recipient of the message. + request_reply (bool or None): whether to request a reply from the recipient. + silent (bool or None): (Experimental) whether to print the message sent. + + Raises: + ValueError: if the message can't be converted into a valid ChatCompletion message. + """ + message = self._process_message_before_send(message, recipient, ConversableAgent._is_silent(self, silent)) + # When the agent composes and sends the message, the role of the message is "assistant" + # unless it's "function". + valid = self._append_oai_message(message, "assistant", recipient, is_sending=True) + if valid: + await recipient.a_receive(message, self, request_reply, silent) + else: + raise ValueError( + "Message can't be converted into a valid ChatCompletion message. Either content or function_call must be provided." + ) + + def _print_received_message(self, message: Union[dict[str, Any], str], sender: Agent, skip_head: bool = False): + message = self._message_to_dict(message) + message_model = create_received_event_model(event=message, sender=sender, recipient=self) + iostream = IOStream.get_default() + # message_model.print(iostream.print) + iostream.send(message_model) + + def _process_received_message(self, message: Union[dict[str, Any], str], sender: Agent, silent: bool): + # When the agent receives a message, the role of the message is "user". (If 'role' exists and is 'function', it will remain unchanged.) 
+ valid = self._append_oai_message(message, "user", sender, is_sending=False) + if logging_enabled(): + log_event(self, "received_message", message=message, sender=sender.name, valid=valid) + + if not valid: + raise ValueError( + "Received message can't be converted into a valid ChatCompletion message. Either content or function_call must be provided." + ) + + if not ConversableAgent._is_silent(sender, silent): + self._print_received_message(message, sender) + + def receive( + self, + message: Union[dict[str, Any], str], + sender: Agent, + request_reply: Optional[bool] = None, + silent: Optional[bool] = False, + ): + """Receive a message from another agent. + + Once a message is received, this function sends a reply to the sender or stop. + The reply can be generated automatically or entered manually by a human. + + Args: + message (dict or str): message from the sender. If the type is dict, it may contain the following reserved fields (either content or function_call need to be provided). + 1. "content": content of the message, can be None. + 2. "function_call": a dictionary containing the function name and arguments. (deprecated in favor of "tool_calls") + 3. "tool_calls": a list of dictionaries containing the function name and arguments. + 4. "role": role of the message, can be "assistant", "user", "function", "tool". + This field is only needed to distinguish between "function" or "assistant"/"user". + 5. "name": In most cases, this field is not needed. When the role is "function", this field is needed to indicate the function name. + 6. "context" (dict): the context of the message, which will be passed to + [OpenAIWrapper.create](https://docs.ag2.ai/latest/docs/api-reference/autogen/OpenAIWrapper/#autogen.OpenAIWrapper.create). + sender: sender of an Agent instance. + request_reply (bool or None): whether a reply is requested from the sender. + If None, the value is determined by `self.reply_at_receive[sender]`. + silent (bool or None): (Experimental) whether to print the message received. + + Raises: + ValueError: if the message can't be converted into a valid ChatCompletion message. + """ + self._process_received_message(message, sender, silent) + if request_reply is False or (request_reply is None and self.reply_at_receive[sender] is False): + return + reply = self.generate_reply(messages=self.chat_messages[sender], sender=sender) + if reply is not None: + self.send(reply, sender, silent=silent) + + async def a_receive( + self, + message: Union[dict[str, Any], str], + sender: Agent, + request_reply: Optional[bool] = None, + silent: Optional[bool] = False, + ): + """(async) Receive a message from another agent. + + Once a message is received, this function sends a reply to the sender or stop. + The reply can be generated automatically or entered manually by a human. + + Args: + message (dict or str): message from the sender. If the type is dict, it may contain the following reserved fields (either content or function_call need to be provided). + 1. "content": content of the message, can be None. + 2. "function_call": a dictionary containing the function name and arguments. (deprecated in favor of "tool_calls") + 3. "tool_calls": a list of dictionaries containing the function name and arguments. + 4. "role": role of the message, can be "assistant", "user", "function". + This field is only needed to distinguish between "function" or "assistant"/"user". + 5. "name": In most cases, this field is not needed. When the role is "function", this field is needed to indicate the function name. 
+ 6. "context" (dict): the context of the message, which will be passed to + [OpenAIWrapper.create](https://docs.ag2.ai/latest/docs/api-reference/autogen/OpenAIWrapper/#autogen.OpenAIWrapper.create). + sender: sender of an Agent instance. + request_reply (bool or None): whether a reply is requested from the sender. + If None, the value is determined by `self.reply_at_receive[sender]`. + silent (bool or None): (Experimental) whether to print the message received. + + Raises: + ValueError: if the message can't be converted into a valid ChatCompletion message. + """ + self._process_received_message(message, sender, silent) + if request_reply is False or (request_reply is None and self.reply_at_receive[sender] is False): + return + reply = await self.a_generate_reply(messages=self.chat_messages[sender], sender=sender) + if reply is not None: + await self.a_send(reply, sender, silent=silent) + + def _prepare_chat( + self, + recipient: "ConversableAgent", + clear_history: bool, + prepare_recipient: bool = True, + reply_at_receive: bool = True, + ) -> None: + self.reset_consecutive_auto_reply_counter(recipient) + self.reply_at_receive[recipient] = reply_at_receive + if clear_history: + self.clear_history(recipient) + self._human_input = [] + if prepare_recipient: + recipient._prepare_chat(self, clear_history, False, reply_at_receive) + + def _raise_exception_on_async_reply_functions(self) -> None: + """Raise an exception if any async reply functions are registered. + + Raises: + RuntimeError: if any async reply functions are registered. + """ + reply_functions = { + f["reply_func"] for f in self._reply_func_list if not f.get("ignore_async_in_sync_chat", False) + } + + async_reply_functions = [f for f in reply_functions if inspect.iscoroutinefunction(f)] + if async_reply_functions: + msg = ( + "Async reply functions can only be used with ConversableAgent.a_initiate_chat(). The following async reply functions are found: " + + ", ".join([f.__name__ for f in async_reply_functions]) + ) + + raise RuntimeError(msg) + + def initiate_chat( + self, + recipient: "ConversableAgent", + clear_history: bool = True, + silent: Optional[bool] = False, + cache: Optional[AbstractCache] = None, + max_turns: Optional[int] = None, + summary_method: Optional[Union[str, Callable[..., Any]]] = DEFAULT_SUMMARY_METHOD, + summary_args: Optional[dict[str, Any]] = {}, + message: Optional[Union[dict[str, Any], str, Callable[..., Any]]] = None, + **kwargs: Any, + ) -> ChatResult: + """Initiate a chat with the recipient agent. + + Reset the consecutive auto reply counter. + If `clear_history` is True, the chat history with the recipient agent will be cleared. + + + Args: + recipient: the recipient agent. + clear_history (bool): whether to clear the chat history with the agent. Default is True. + silent (bool or None): (Experimental) whether to print the messages for this conversation. Default is False. + cache (AbstractCache or None): the cache client to be used for this conversation. Default is None. + max_turns (int or None): the maximum number of turns for the chat between the two agents. One turn means one conversation round trip. Note that this is different from + `max_consecutive_auto_reply` which is the maximum number of consecutive auto replies; and it is also different from `max_rounds` in GroupChat which is the maximum number of rounds in a group chat session. + If max_turns is set to None, the chat will continue until a termination condition is met. Default is None. 
+ summary_method (str or callable): a method to get a summary from the chat. Default is DEFAULT_SUMMARY_METHOD, i.e., "last_msg". + Supported strings are "last_msg" and "reflection_with_llm": + - when set to "last_msg", it returns the last message of the dialog as the summary. + - when set to "reflection_with_llm", it returns a summary extracted using an llm client. + `llm_config` must be set in either the recipient or sender. + + A callable summary_method should take the recipient and sender agent in a chat as input and return a string of summary. E.g., + + ```python + def my_summary_method( + sender: ConversableAgent, + recipient: ConversableAgent, + summary_args: dict, + ): + return recipient.last_message(sender)["content"] + ``` + summary_args (dict): a dictionary of arguments to be passed to the summary_method. + One example key is "summary_prompt", and value is a string of text used to prompt a LLM-based agent (the sender or recipient agent) to reflect + on the conversation and extract a summary when summary_method is "reflection_with_llm". + The default summary_prompt is DEFAULT_SUMMARY_PROMPT, i.e., "Summarize takeaway from the conversation. Do not add any introductory phrases. If the intended request is NOT properly addressed, please point it out." + Another available key is "summary_role", which is the role of the message sent to the agent in charge of summarizing. Default is "system". + message (str, dict or Callable): the initial message to be sent to the recipient. Needs to be provided. Otherwise, input() will be called to get the initial message. + - If a string or a dict is provided, it will be used as the initial message. `generate_init_message` is called to generate the initial message for the agent based on this string and the context. + If dict, it may contain the following reserved fields (either content or tool_calls need to be provided). + + 1. "content": content of the message, can be None. + 2. "function_call": a dictionary containing the function name and arguments. (deprecated in favor of "tool_calls") + 3. "tool_calls": a list of dictionaries containing the function name and arguments. + 4. "role": role of the message, can be "assistant", "user", "function". + This field is only needed to distinguish between "function" or "assistant"/"user". + 5. "name": In most cases, this field is not needed. When the role is "function", this field is needed to indicate the function name. + 6. "context" (dict): the context of the message, which will be passed to + `OpenAIWrapper.create`. + + - If a callable is provided, it will be called to get the initial message in the form of a string or a dict. + If the returned type is dict, it may contain the reserved fields mentioned above. + + Example of a callable message (returning a string): + + ```python + def my_message( + sender: ConversableAgent, recipient: ConversableAgent, context: dict + ) -> Union[str, Dict]: + carryover = context.get("carryover", "") + if isinstance(message, list): + carryover = carryover[-1] + final_msg = "Write a blogpost." + "\\nContext: \\n" + carryover + return final_msg + ``` + + Example of a callable message (returning a dict): + + ```python + def my_message( + sender: ConversableAgent, recipient: ConversableAgent, context: dict + ) -> Union[str, Dict]: + final_msg = {} + carryover = context.get("carryover", "") + if isinstance(message, list): + carryover = carryover[-1] + final_msg["content"] = "Write a blogpost." 
+ "\\nContext: \\n" + carryover + final_msg["context"] = {"prefix": "Today I feel"} + return final_msg + ``` + **kwargs: any additional information. It has the following reserved fields: + - "carryover": a string or a list of string to specify the carryover information to be passed to this chat. + If provided, we will combine this carryover (by attaching a "context: " string and the carryover content after the message content) with the "message" content when generating the initial chat + message in `generate_init_message`. + - "verbose": a boolean to specify whether to print the message and carryover in a chat. Default is False. + + Raises: + RuntimeError: if any async reply functions are registered and not ignored in sync chat. + + Returns: + ChatResult: an ChatResult object. + """ + iostream = IOStream.get_default() + + cache = Cache.get_current_cache(cache) + _chat_info = locals().copy() + _chat_info["sender"] = self + consolidate_chat_info(_chat_info, uniform_sender=self) + for agent in [self, recipient]: + agent._raise_exception_on_async_reply_functions() + agent.previous_cache = agent.client_cache + agent.client_cache = cache + if isinstance(max_turns, int): + self._prepare_chat(recipient, clear_history, reply_at_receive=False) + for i in range(max_turns): + # check recipient max consecutive auto reply limit + if self._consecutive_auto_reply_counter[recipient] >= recipient._max_consecutive_auto_reply: + break + if i == 0: + if isinstance(message, Callable): + msg2send = message(_chat_info["sender"], _chat_info["recipient"], kwargs) + else: + msg2send = self.generate_init_message(message, **kwargs) + else: + msg2send = self.generate_reply(messages=self.chat_messages[recipient], sender=recipient) + if msg2send is None: + break + self.send(msg2send, recipient, request_reply=True, silent=silent) + + else: # No breaks in the for loop, so we have reached max turns + iostream.send(TerminationEvent(termination_reason=f"Maximum turns ({max_turns}) reached")) + else: + self._prepare_chat(recipient, clear_history) + if isinstance(message, Callable): + msg2send = message(_chat_info["sender"], _chat_info["recipient"], kwargs) + else: + msg2send = self.generate_init_message(message, **kwargs) + self.send(msg2send, recipient, silent=silent) + summary = self._summarize_chat( + summary_method, + summary_args, + recipient, + cache=cache, + ) + for agent in [self, recipient]: + agent.client_cache = agent.previous_cache + agent.previous_cache = None + chat_result = ChatResult( + chat_history=self.chat_messages[recipient], + summary=summary, + cost=gather_usage_summary([self, recipient]), + human_input=self._human_input, + ) + return chat_result + + def run( + self, + recipient: Optional["ConversableAgent"] = None, + clear_history: bool = True, + silent: Optional[bool] = False, + cache: Optional[AbstractCache] = None, + max_turns: Optional[int] = None, + summary_method: Optional[Union[str, Callable[..., Any]]] = DEFAULT_SUMMARY_METHOD, + summary_args: Optional[dict[str, Any]] = {}, + message: Optional[Union[dict[str, Any], str, Callable[..., Any]]] = None, + executor_kwargs: Optional[dict[str, Any]] = None, + tools: Optional[Union[Tool, Iterable[Tool]]] = None, + user_input: Optional[bool] = False, + msg_to: Optional[str] = "agent", + **kwargs: Any, + ) -> RunResponseProtocol: + iostream = ThreadIOStream() + agents = [self, recipient] if recipient else [self] + response = RunResponse(iostream, agents=agents) + + if recipient is None: + + def initiate_chat( + self=self, + iostream: ThreadIOStream = 
iostream, + response: RunResponse = response, + ) -> None: + with ( + IOStream.set_default(iostream), + self._create_or_get_executor( + executor_kwargs=executor_kwargs, + tools=tools, + agent_name="user", + agent_human_input_mode="ALWAYS" if user_input else "NEVER", + ) as executor, + ): + try: + if msg_to == "agent": + chat_result = executor.initiate_chat( + self, + message=message, + clear_history=clear_history, + max_turns=max_turns, + summary_method=summary_method, + ) + else: + chat_result = self.initiate_chat( + executor, + message=message, + clear_history=clear_history, + max_turns=max_turns, + summary_method=summary_method, + ) + + IOStream.get_default().send( + RunCompletionEvent( + history=chat_result.chat_history, + summary=chat_result.summary, + cost=chat_result.cost, + last_speaker=self.name, + ) + ) + except Exception as e: + response.iostream.send(ErrorEvent(error=e)) + + else: + + def initiate_chat( + self=self, + iostream: ThreadIOStream = iostream, + response: RunResponse = response, + ) -> None: + with IOStream.set_default(iostream): # type: ignore[arg-type] + try: + chat_result = self.initiate_chat( + recipient, + clear_history=clear_history, + silent=silent, + cache=cache, + max_turns=max_turns, + summary_method=summary_method, + summary_args=summary_args, + message=message, + **kwargs, + ) + + response._summary = chat_result.summary + response._messages = chat_result.chat_history + + _last_speaker = recipient if chat_result.chat_history[-1]["name"] == recipient.name else self + if hasattr(recipient, "last_speaker"): + _last_speaker = recipient.last_speaker + + IOStream.get_default().send( + RunCompletionEvent( + history=chat_result.chat_history, + summary=chat_result.summary, + cost=chat_result.cost, + last_speaker=_last_speaker.name, + ) + ) + except Exception as e: + response.iostream.send(ErrorEvent(error=e)) + + threading.Thread( + target=initiate_chat, + ).start() + + return response + + async def a_initiate_chat( + self, + recipient: "ConversableAgent", + clear_history: bool = True, + silent: Optional[bool] = False, + cache: Optional[AbstractCache] = None, + max_turns: Optional[int] = None, + summary_method: Optional[Union[str, Callable[..., Any]]] = DEFAULT_SUMMARY_METHOD, + summary_args: Optional[dict[str, Any]] = {}, + message: Optional[Union[str, Callable[..., Any]]] = None, + **kwargs: Any, + ) -> ChatResult: + """(async) Initiate a chat with the recipient agent. + + Reset the consecutive auto reply counter. + If `clear_history` is True, the chat history with the recipient agent will be cleared. + `a_generate_init_message` is called to generate the initial message for the agent. + + Args: Please refer to `initiate_chat`. + + Returns: + ChatResult: an ChatResult object. 
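+
+        A minimal async usage sketch (assuming `user_proxy` and `assistant` are configured
+        ConversableAgent instances):
+
+        ```python
+        import asyncio
+
+        async def main():
+            result = await user_proxy.a_initiate_chat(
+                assistant,
+                message="Outline the steps to reproduce the bug.",
+                max_turns=2,
+            )
+            print(result.summary)
+
+        asyncio.run(main())
+        ```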
+ """ + iostream = IOStream.get_default() + + _chat_info = locals().copy() + _chat_info["sender"] = self + consolidate_chat_info(_chat_info, uniform_sender=self) + for agent in [self, recipient]: + agent.previous_cache = agent.client_cache + agent.client_cache = cache + if isinstance(max_turns, int): + self._prepare_chat(recipient, clear_history, reply_at_receive=False) + for _ in range(max_turns): + if _ == 0: + if isinstance(message, Callable): + msg2send = message(_chat_info["sender"], _chat_info["recipient"], kwargs) + else: + msg2send = await self.a_generate_init_message(message, **kwargs) + else: + msg2send = await self.a_generate_reply(messages=self.chat_messages[recipient], sender=recipient) + if msg2send is None: + break + await self.a_send(msg2send, recipient, request_reply=True, silent=silent) + else: # No breaks in the for loop, so we have reached max turns + iostream.send(TerminationEvent(termination_reason=f"Maximum turns ({max_turns}) reached")) + else: + self._prepare_chat(recipient, clear_history) + if isinstance(message, Callable): + msg2send = message(_chat_info["sender"], _chat_info["recipient"], kwargs) + else: + msg2send = await self.a_generate_init_message(message, **kwargs) + await self.a_send(msg2send, recipient, silent=silent) + summary = self._summarize_chat( + summary_method, + summary_args, + recipient, + cache=cache, + ) + for agent in [self, recipient]: + agent.client_cache = agent.previous_cache + agent.previous_cache = None + chat_result = ChatResult( + chat_history=self.chat_messages[recipient], + summary=summary, + cost=gather_usage_summary([self, recipient]), + human_input=self._human_input, + ) + return chat_result + + async def a_run( + self, + recipient: Optional["ConversableAgent"] = None, + clear_history: bool = True, + silent: Optional[bool] = False, + cache: Optional[AbstractCache] = None, + max_turns: Optional[int] = None, + summary_method: Optional[Union[str, Callable[..., Any]]] = DEFAULT_SUMMARY_METHOD, + summary_args: Optional[dict[str, Any]] = {}, + message: Optional[Union[dict[str, Any], str, Callable[..., Any]]] = None, + executor_kwargs: Optional[dict[str, Any]] = None, + tools: Optional[Union[Tool, Iterable[Tool]]] = None, + user_input: Optional[bool] = False, + msg_to: Optional[str] = "agent", + **kwargs: Any, + ) -> AsyncRunResponseProtocol: + iostream = AsyncThreadIOStream() + agents = [self, recipient] if recipient else [self] + response = AsyncRunResponse(iostream, agents=agents) + + if recipient is None: + + async def initiate_chat( + self=self, + iostream: AsyncThreadIOStream = iostream, + response: AsyncRunResponse = response, + ) -> None: + with ( + IOStream.set_default(iostream), + self._create_or_get_executor( + executor_kwargs=executor_kwargs, + tools=tools, + agent_name="user", + agent_human_input_mode="ALWAYS" if user_input else "NEVER", + ) as executor, + ): + try: + if msg_to == "agent": + chat_result = await executor.a_initiate_chat( + self, + message=message, + clear_history=clear_history, + max_turns=max_turns, + summary_method=summary_method, + ) + else: + chat_result = await self.a_initiate_chat( + executor, + message=message, + clear_history=clear_history, + max_turns=max_turns, + summary_method=summary_method, + ) + + IOStream.get_default().send( + RunCompletionEvent( + history=chat_result.chat_history, + summary=chat_result.summary, + cost=chat_result.cost, + last_speaker=self.name, + ) + ) + except Exception as e: + response.iostream.send(ErrorEvent(error=e)) + + else: + + async def initiate_chat( + self=self, + 
iostream: AsyncThreadIOStream = iostream, + response: AsyncRunResponse = response, + ) -> None: + with IOStream.set_default(iostream): # type: ignore[arg-type] + try: + chat_result = await self.a_initiate_chat( + recipient, + clear_history=clear_history, + silent=silent, + cache=cache, + max_turns=max_turns, + summary_method=summary_method, + summary_args=summary_args, + message=message, + **kwargs, + ) + + last_speaker = recipient if chat_result.chat_history[-1]["name"] == recipient.name else self + if hasattr(recipient, "last_speaker"): + last_speaker = recipient.last_speaker + + IOStream.get_default().send( + RunCompletionEvent( + history=chat_result.chat_history, + summary=chat_result.summary, + cost=chat_result.cost, + last_speaker=last_speaker.name, + ) + ) + + except Exception as e: + response.iostream.send(ErrorEvent(error=e)) + + asyncio.create_task(initiate_chat()) + + return response + + def _summarize_chat( + self, + summary_method, + summary_args, + recipient: Optional[Agent] = None, + cache: Optional[AbstractCache] = None, + ) -> str: + """Get a chat summary from an agent participating in a chat. + + Args: + summary_method (str or callable): the summary_method to get the summary. + The callable summary_method should take the recipient and sender agent in a chat as input and return a string of summary. E.g, + ```python + def my_summary_method( + sender: ConversableAgent, + recipient: ConversableAgent, + summary_args: dict, + ): + return recipient.last_message(sender)["content"] + ``` + summary_args (dict): a dictionary of arguments to be passed to the summary_method. + recipient: the recipient agent in a chat. + cache: the cache client to be used for this conversation. When provided, + the cache will be used to store and retrieve LLM responses when generating + summaries, which can improve performance and reduce API costs for + repetitive summary requests. The cache is passed to the summary_method + via summary_args['cache']. + + Returns: + str: a chat summary from the agent. + """ + summary = "" + if summary_method is None: + return summary + if "cache" not in summary_args: + summary_args["cache"] = cache + if summary_method == "reflection_with_llm": + summary_method = self._reflection_with_llm_as_summary + elif summary_method == "last_msg": + summary_method = self._last_msg_as_summary + + if isinstance(summary_method, Callable): + summary = summary_method(self, recipient, summary_args) + else: + raise ValueError( + "If not None, the summary_method must be a string from [`reflection_with_llm`, `last_msg`] or a callable." + ) + return summary + + @staticmethod + def _last_msg_as_summary(sender, recipient, summary_args) -> str: + """Get a chat summary from the last message of the recipient.""" + summary = "" + try: + content = recipient.last_message(sender)["content"] + if isinstance(content, str): + summary = content.replace("TERMINATE", "") + elif isinstance(content, list): + # Remove the `TERMINATE` word in the content list. + summary = "\n".join( + x["text"].replace("TERMINATE", "") for x in content if isinstance(x, dict) and "text" in x + ) + except (IndexError, AttributeError) as e: + warnings.warn(f"Cannot extract summary using last_msg: {e}. 
Using an empty str as summary.", UserWarning) + return summary + + @staticmethod + def _reflection_with_llm_as_summary(sender, recipient, summary_args): + prompt = summary_args.get("summary_prompt") + prompt = ConversableAgent.DEFAULT_SUMMARY_PROMPT if prompt is None else prompt + if not isinstance(prompt, str): + raise ValueError("The summary_prompt must be a string.") + msg_list = recipient.chat_messages_for_summary(sender) + agent = sender if recipient is None else recipient + role = summary_args.get("summary_role", None) + if role and not isinstance(role, str): + raise ValueError("The summary_role in summary_arg must be a string.") + try: + summary = sender._reflection_with_llm( + prompt, msg_list, llm_agent=agent, cache=summary_args.get("cache"), role=role + ) + except Exception as e: + warnings.warn( + f"Cannot extract summary using reflection_with_llm: {e}. Using an empty str as summary.", UserWarning + ) + summary = "" + return summary + + def _reflection_with_llm( + self, + prompt, + messages, + llm_agent: Optional[Agent] = None, + cache: Optional[AbstractCache] = None, + role: Union[str, None] = None, + ) -> str: + """Get a chat summary using reflection with an llm client based on the conversation history. + + Args: + prompt (str): The prompt (in this method it is used as system prompt) used to get the summary. + messages (list): The messages generated as part of a chat conversation. + llm_agent: the agent with an llm client. + cache (AbstractCache or None): the cache client to be used for this conversation. + role (str): the role of the message, usually "system" or "user". Default is "system". + """ + if not role: + role = "system" + + system_msg = [ + { + "role": role, + "content": prompt, + } + ] + + messages = messages + system_msg + if llm_agent and llm_agent.client is not None: + llm_client = llm_agent.client + elif self.client is not None: + llm_client = self.client + else: + raise ValueError("No OpenAIWrapper client is found.") + response = self._generate_oai_reply_from_client(llm_client=llm_client, messages=messages, cache=cache) + return response + + def _check_chat_queue_for_sender(self, chat_queue: list[dict[str, Any]]) -> list[dict[str, Any]]: + """Check the chat queue and add the "sender" key if it's missing. + + Args: + chat_queue (List[Dict[str, Any]]): A list of dictionaries containing chat information. + + Returns: + List[Dict[str, Any]]: A new list of dictionaries with the "sender" key added if it was missing. + """ + chat_queue_with_sender = [] + for chat_info in chat_queue: + if chat_info.get("sender") is None: + chat_info["sender"] = self + chat_queue_with_sender.append(chat_info) + return chat_queue_with_sender + + def initiate_chats(self, chat_queue: list[dict[str, Any]]) -> list[ChatResult]: + """(Experimental) Initiate chats with multiple agents. + + Args: + chat_queue (List[Dict]): a list of dictionaries containing the information of the chats. + Each dictionary should contain the input arguments for [`initiate_chat`](#initiate-chat) + + Returns: a list of ChatResult objects corresponding to the finished chats in the chat_queue. + """ + _chat_queue = self._check_chat_queue_for_sender(chat_queue) + self._finished_chats = initiate_chats(_chat_queue) + + return self._finished_chats + + def sequential_run( + self, + chat_queue: list[dict[str, Any]], + ) -> list[RunResponseProtocol]: + """(Experimental) Initiate chats with multiple agents sequentially. + + Args: + chat_queue (List[Dict]): a list of dictionaries containing the information of the chats. 
+ Each dictionary should contain the input arguments for [`initiate_chat`](#initiate-chat) + + Returns: a list of ChatResult objects corresponding to the finished chats in the chat_queue. + """ + iostreams = [ThreadIOStream() for _ in range(len(chat_queue))] + # todo: add agents + responses = [RunResponse(iostream, agents=[]) for iostream in iostreams] + + def _initiate_chats( + iostreams: list[ThreadIOStream] = iostreams, + responses: list[RunResponseProtocol] = responses, + ) -> None: + response = responses[0] + try: + _chat_queue = self._check_chat_queue_for_sender(chat_queue) + + consolidate_chat_info(_chat_queue) + _validate_recipients(_chat_queue) + finished_chats = [] + for chat_info, response, iostream in zip(_chat_queue, responses, iostreams): + with IOStream.set_default(iostream): + _chat_carryover = chat_info.get("carryover", []) + finished_chat_indexes_to_exclude_from_carryover = chat_info.get( + "finished_chat_indexes_to_exclude_from_carryover", [] + ) + + if isinstance(_chat_carryover, str): + _chat_carryover = [_chat_carryover] + chat_info["carryover"] = _chat_carryover + [ + r.summary + for i, r in enumerate(finished_chats) + if i not in finished_chat_indexes_to_exclude_from_carryover + ] + + if not chat_info.get("silent", False): + IOStream.get_default().send(PostCarryoverProcessingEvent(chat_info=chat_info)) + + sender = chat_info["sender"] + chat_res = sender.initiate_chat(**chat_info) + + IOStream.get_default().send( + RunCompletionEvent( + history=chat_res.chat_history, + summary=chat_res.summary, + cost=chat_res.cost, + last_speaker=(self if chat_res.chat_history[-1]["name"] == self.name else sender).name, + ) + ) + + finished_chats.append(chat_res) + except Exception as e: + response.iostream.send(ErrorEvent(error=e)) + + threading.Thread(target=_initiate_chats).start() + + return responses + + async def a_initiate_chats(self, chat_queue: list[dict[str, Any]]) -> dict[int, ChatResult]: + _chat_queue = self._check_chat_queue_for_sender(chat_queue) + self._finished_chats = await a_initiate_chats(_chat_queue) + return self._finished_chats + + async def a_sequential_run( + self, + chat_queue: list[dict[str, Any]], + ) -> list[AsyncRunResponseProtocol]: + """(Experimental) Initiate chats with multiple agents sequentially. + + Args: + chat_queue (List[Dict]): a list of dictionaries containing the information of the chats. + Each dictionary should contain the input arguments for [`initiate_chat`](#initiate-chat) + + Returns: a list of ChatResult objects corresponding to the finished chats in the chat_queue. 
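+
+        Example (illustrative only; `user`, `writer`, and `critic` are placeholder agents
+        created elsewhere, and the chat_queue entries simply mirror `initiate_chat` arguments):
+            ```python
+            responses = await user.a_sequential_run([
+                {"recipient": writer, "message": "Draft a haiku about autumn.", "max_turns": 1},
+                {"recipient": critic, "message": "Critique the haiku.", "max_turns": 1},
+            ])
+            ```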
+ """ + iostreams = [AsyncThreadIOStream() for _ in range(len(chat_queue))] + # todo: add agents + responses = [AsyncRunResponse(iostream, agents=[]) for iostream in iostreams] + + async def _a_initiate_chats( + iostreams: list[AsyncThreadIOStream] = iostreams, + responses: list[AsyncRunResponseProtocol] = responses, + ) -> None: + response = responses[0] + try: + _chat_queue = self._check_chat_queue_for_sender(chat_queue) + + consolidate_chat_info(_chat_queue) + _validate_recipients(_chat_queue) + finished_chats = [] + for chat_info, response, iostream in zip(_chat_queue, responses, iostreams): + with IOStream.set_default(iostream): + _chat_carryover = chat_info.get("carryover", []) + finished_chat_indexes_to_exclude_from_carryover = chat_info.get( + "finished_chat_indexes_to_exclude_from_carryover", [] + ) + + if isinstance(_chat_carryover, str): + _chat_carryover = [_chat_carryover] + chat_info["carryover"] = _chat_carryover + [ + r.summary + for i, r in enumerate(finished_chats) + if i not in finished_chat_indexes_to_exclude_from_carryover + ] + + if not chat_info.get("silent", False): + IOStream.get_default().send(PostCarryoverProcessingEvent(chat_info=chat_info)) + + sender = chat_info["sender"] + chat_res = await sender.a_initiate_chat(**chat_info) + + IOStream.get_default().send( + RunCompletionEvent( + history=chat_res.chat_history, + summary=chat_res.summary, + cost=chat_res.cost, + last_speaker=(self if chat_res.chat_history[-1]["name"] == self.name else sender).name, + ) + ) + + finished_chats.append(chat_res) + + except Exception as e: + response.iostream.send(ErrorEvent(error=e)) + + asyncio.create_task(_a_initiate_chats()) + + return responses + + def get_chat_results(self, chat_index: Optional[int] = None) -> Union[list[ChatResult], ChatResult]: + """A summary from the finished chats of particular agents.""" + if chat_index is not None: + return self._finished_chats[chat_index] + else: + return self._finished_chats + + def reset(self) -> None: + """Reset the agent.""" + self.clear_history() + self.reset_consecutive_auto_reply_counter() + self.stop_reply_at_receive() + if self.client is not None: + self.client.clear_usage_summary() + for reply_func_tuple in self._reply_func_list: + if reply_func_tuple["reset_config"] is not None: + reply_func_tuple["reset_config"](reply_func_tuple["config"]) + else: + reply_func_tuple["config"] = copy.copy(reply_func_tuple["init_config"]) + + def stop_reply_at_receive(self, sender: Optional[Agent] = None): + """Reset the reply_at_receive of the sender.""" + if sender is None: + self.reply_at_receive.clear() + else: + self.reply_at_receive[sender] = False + + def reset_consecutive_auto_reply_counter(self, sender: Optional[Agent] = None): + """Reset the consecutive_auto_reply_counter of the sender.""" + if sender is None: + self._consecutive_auto_reply_counter.clear() + else: + self._consecutive_auto_reply_counter[sender] = 0 + + def clear_history(self, recipient: Optional[Agent] = None, nr_messages_to_preserve: Optional[int] = None): + """Clear the chat history of the agent. + + Args: + recipient: the agent with whom the chat history to clear. If None, clear the chat history with all agents. + nr_messages_to_preserve: the number of newest messages to preserve in the chat history. 
+ """ + iostream = IOStream.get_default() + if recipient is None: + no_messages_preserved = 0 + if nr_messages_to_preserve: + for key in self._oai_messages: + nr_messages_to_preserve_internal = nr_messages_to_preserve + # if breaking history between function call and function response, save function call message + # additionally, otherwise openai will return error + first_msg_to_save = self._oai_messages[key][-nr_messages_to_preserve_internal] + if "tool_responses" in first_msg_to_save: + nr_messages_to_preserve_internal += 1 + # clear_conversable_agent_history.print_preserving_message(iostream.print) + no_messages_preserved += 1 + # Remove messages from history except last `nr_messages_to_preserve` messages. + self._oai_messages[key] = self._oai_messages[key][-nr_messages_to_preserve_internal:] + iostream.send(ClearConversableAgentHistoryEvent(agent=self, no_events_preserved=no_messages_preserved)) + else: + self._oai_messages.clear() + else: + self._oai_messages[recipient].clear() + # clear_conversable_agent_history.print_warning(iostream.print) + if nr_messages_to_preserve: + iostream.send(ClearConversableAgentHistoryWarningEvent(recipient=self)) + + def generate_oai_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[OpenAIWrapper] = None, + ) -> tuple[bool, Optional[Union[str, dict[str, Any]]]]: + """Generate a reply using autogen.oai.""" + client = self.client if config is None else config + if client is None: + return False, None + if messages is None: + messages = self._oai_messages[sender] + extracted_response = self._generate_oai_reply_from_client( + client, self._oai_system_message + messages, self.client_cache + ) + return (False, None) if extracted_response is None else (True, extracted_response) + + def _generate_oai_reply_from_client(self, llm_client, messages, cache) -> Optional[Union[str, dict[str, Any]]]: + # unroll tool_responses + all_messages = [] + for message in messages: + tool_responses = message.get("tool_responses", []) + if tool_responses: + all_messages += tool_responses + # tool role on the parent message means the content is just concatenation of all of the tool_responses + if message.get("role") != "tool": + all_messages.append({key: message[key] for key in message if key != "tool_responses"}) + else: + all_messages.append(message) + + # TODO: #1143 handle token limit exceeded error + response = llm_client.create( + context=messages[-1].pop("context", None), + messages=all_messages, + cache=cache, + agent=self, + ) + extracted_response = llm_client.extract_text_or_completion_object(response)[0] + + if extracted_response is None: + warnings.warn(f"Extracted_response from {response} is None.", UserWarning) + return None + # ensure function and tool calls will be accepted when sent back to the LLM + if not isinstance(extracted_response, str) and hasattr(extracted_response, "model_dump"): + extracted_response = extracted_response.model_dump() + if isinstance(extracted_response, dict): + if extracted_response.get("function_call"): + extracted_response["function_call"]["name"] = self._normalize_name( + extracted_response["function_call"]["name"] + ) + for tool_call in extracted_response.get("tool_calls") or []: + tool_call["function"]["name"] = self._normalize_name(tool_call["function"]["name"]) + # Remove id and type if they are not present. + # This is to make the tool call object compatible with Mistral API. 
+ if tool_call.get("id") is None: + tool_call.pop("id") + if tool_call.get("type") is None: + tool_call.pop("type") + return extracted_response + + async def a_generate_oai_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[Any] = None, + ) -> tuple[bool, Optional[Union[str, dict[str, Any]]]]: + """Generate a reply using autogen.oai asynchronously.""" + iostream = IOStream.get_default() + + def _generate_oai_reply( + self, iostream: IOStream, *args: Any, **kwargs: Any + ) -> tuple[bool, Optional[Union[str, dict[str, Any]]]]: + with IOStream.set_default(iostream): + return self.generate_oai_reply(*args, **kwargs) + + return await asyncio.get_event_loop().run_in_executor( + None, + functools.partial( + _generate_oai_reply, self=self, iostream=iostream, messages=messages, sender=sender, config=config + ), + ) + + def _generate_code_execution_reply_using_executor( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[Union[dict[str, Any], Literal[False]]] = None, + ): + """Generate a reply using code executor.""" + iostream = IOStream.get_default() + + if config is not None: + raise ValueError("config is not supported for _generate_code_execution_reply_using_executor.") + if self._code_execution_config is False: + return False, None + if messages is None: + messages = self._oai_messages[sender] + last_n_messages = self._code_execution_config.get("last_n_messages", "auto") + + if not (isinstance(last_n_messages, (int, float)) and last_n_messages >= 0) and last_n_messages != "auto": + raise ValueError("last_n_messages must be either a non-negative integer, or the string 'auto'.") + + num_messages_to_scan = last_n_messages + if last_n_messages == "auto": + # Find when the agent last spoke + num_messages_to_scan = 0 + for message in reversed(messages): + if "role" not in message or message["role"] != "user": + break + else: + num_messages_to_scan += 1 + num_messages_to_scan = min(len(messages), num_messages_to_scan) + messages_to_scan = messages[-num_messages_to_scan:] + + # iterate through the last n messages in reverse + # if code blocks are found, execute the code blocks and return the output + # if no code blocks are found, continue + for message in reversed(messages_to_scan): + if not message["content"]: + continue + code_blocks = self._code_executor.code_extractor.extract_code_blocks(message["content"]) + if len(code_blocks) == 0: + continue + + iostream.send(GenerateCodeExecutionReplyEvent(code_blocks=code_blocks, sender=sender, recipient=self)) + + # found code blocks, execute code. 
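+            # The executor result is folded into a single reply string of the form
+            # "exitcode: <code> (<status>)\nCode output: <output>".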
+ code_result = self._code_executor.execute_code_blocks(code_blocks) + exitcode2str = "execution succeeded" if code_result.exit_code == 0 else "execution failed" + return True, f"exitcode: {code_result.exit_code} ({exitcode2str})\nCode output: {code_result.output}" + + return False, None + + def generate_code_execution_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[Union[dict[str, Any], Literal[False]]] = None, + ): + """Generate a reply using code execution.""" + code_execution_config = config if config is not None else self._code_execution_config + if code_execution_config is False: + return False, None + if messages is None: + messages = self._oai_messages[sender] + last_n_messages = code_execution_config.pop("last_n_messages", "auto") + + if not (isinstance(last_n_messages, (int, float)) and last_n_messages >= 0) and last_n_messages != "auto": + raise ValueError("last_n_messages must be either a non-negative integer, or the string 'auto'.") + + messages_to_scan = last_n_messages + if last_n_messages == "auto": + # Find when the agent last spoke + messages_to_scan = 0 + for i in range(len(messages)): + message = messages[-(i + 1)] + if "role" not in message or message["role"] != "user": + break + else: + messages_to_scan += 1 + + # iterate through the last n messages in reverse + # if code blocks are found, execute the code blocks and return the output + # if no code blocks are found, continue + for i in range(min(len(messages), messages_to_scan)): + message = messages[-(i + 1)] + if not message["content"]: + continue + code_blocks = extract_code(message["content"]) + if len(code_blocks) == 1 and code_blocks[0][0] == UNKNOWN: + continue + + # found code blocks, execute code and push "last_n_messages" back + exitcode, logs = self.execute_code_blocks(code_blocks) + code_execution_config["last_n_messages"] = last_n_messages + exitcode2str = "execution succeeded" if exitcode == 0 else "execution failed" + return True, f"exitcode: {exitcode} ({exitcode2str})\nCode output: {logs}" + + # no code blocks are found, push last_n_messages back and return. + code_execution_config["last_n_messages"] = last_n_messages + + return False, None + + def _run_async_in_thread(self, coro): + """Run an async coroutine in a separate thread with its own event loop.""" + result = {} + + def runner(): + loop = asyncio.new_event_loop() + asyncio.set_event_loop(loop) + result["value"] = loop.run_until_complete(coro) + loop.close() + + t = threading.Thread(target=runner) + t.start() + t.join() + return result["value"] + + def generate_function_call_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[Any] = None, + ) -> tuple[bool, Optional[dict[str, Any]]]: + """Generate a reply using function call. 
+ + "function_call" replaced by "tool_calls" as of [OpenAI API v1.1.0](https://github.com/openai/openai-python/releases/tag/v1.1.0) + See https://platform.openai.com/docs/api-reference/chat/create#chat-create-functions + """ + if config is None: + config = self + if messages is None: + messages = self._oai_messages[sender] + message = messages[-1] + if message.get("function_call"): + call_id = message.get("id", None) + func_call = message["function_call"] + func = self._function_map.get(func_call.get("name", None), None) + if inspect.iscoroutinefunction(func): + coro = self.a_execute_function(func_call, call_id=call_id) + _, func_return = self._run_async_in_thread(coro) + else: + _, func_return = self.execute_function(message["function_call"], call_id=call_id) + return True, func_return + return False, None + + async def a_generate_function_call_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[Any] = None, + ) -> tuple[bool, Optional[dict[str, Any]]]: + """Generate a reply using async function call. + + "function_call" replaced by "tool_calls" as of [OpenAI API v1.1.0](https://github.com/openai/openai-python/releases/tag/v1.1.0) + See https://platform.openai.com/docs/api-reference/chat/create#chat-create-functions + """ + if config is None: + config = self + if messages is None: + messages = self._oai_messages[sender] + message = messages[-1] + if "function_call" in message: + call_id = message.get("id", None) + func_call = message["function_call"] + func_name = func_call.get("name", "") + func = self._function_map.get(func_name, None) + if func and inspect.iscoroutinefunction(func): + _, func_return = await self.a_execute_function(func_call, call_id=call_id) + else: + _, func_return = self.execute_function(func_call, call_id=call_id) + return True, func_return + + return False, None + + def _str_for_tool_response(self, tool_response): + return str(tool_response.get("content", "")) + + def generate_tool_calls_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[Any] = None, + ) -> tuple[bool, Optional[dict[str, Any]]]: + """Generate a reply using tool call.""" + if config is None: + config = self + if messages is None: + messages = self._oai_messages[sender] + message = messages[-1] + tool_returns = [] + for tool_call in message.get("tool_calls", []): + function_call = tool_call.get("function", {}) + tool_call_id = tool_call.get("id", None) + func = self._function_map.get(function_call.get("name", None), None) + if inspect.iscoroutinefunction(func): + coro = self.a_execute_function(function_call, call_id=tool_call_id) + _, func_return = self._run_async_in_thread(coro) + else: + _, func_return = self.execute_function(function_call, call_id=tool_call_id) + content = func_return.get("content", "") + if content is None: + content = "" + + if tool_call_id is not None: + tool_call_response = { + "tool_call_id": tool_call_id, + "role": "tool", + "content": content, + } + else: + # Do not include tool_call_id if it is not present. + # This is to make the tool call object compatible with Mistral API. 
+ tool_call_response = { + "role": "tool", + "content": content, + } + tool_returns.append(tool_call_response) + if tool_returns: + return True, { + "role": "tool", + "tool_responses": tool_returns, + "content": "\n\n".join([self._str_for_tool_response(tool_return) for tool_return in tool_returns]), + } + return False, None + + async def _a_execute_tool_call(self, tool_call): + tool_call_id = tool_call["id"] + function_call = tool_call.get("function", {}) + _, func_return = await self.a_execute_function(function_call, call_id=tool_call_id) + return { + "tool_call_id": tool_call_id, + "role": "tool", + "content": func_return.get("content", ""), + } + + async def a_generate_tool_calls_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[Any] = None, + ) -> tuple[bool, Optional[dict[str, Any]]]: + """Generate a reply using async function call.""" + if config is None: + config = self + if messages is None: + messages = self._oai_messages[sender] + message = messages[-1] + async_tool_calls = [] + for tool_call in message.get("tool_calls", []): + async_tool_calls.append(self._a_execute_tool_call(tool_call)) + if async_tool_calls: + tool_returns = await asyncio.gather(*async_tool_calls) + return True, { + "role": "tool", + "tool_responses": tool_returns, + "content": "\n\n".join([self._str_for_tool_response(tool_return) for tool_return in tool_returns]), + } + + return False, None + + def check_termination_and_human_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[Any] = None, + ) -> tuple[bool, Union[str, None]]: + """Check if the conversation should be terminated, and if human reply is provided. + + This method checks for conditions that require the conversation to be terminated, such as reaching + a maximum number of consecutive auto-replies or encountering a termination message. Additionally, + it prompts for and processes human input based on the configured human input mode, which can be + 'ALWAYS', 'NEVER', or 'TERMINATE'. The method also manages the consecutive auto-reply counter + for the conversation and prints relevant messages based on the human input received. + + Args: + messages: A list of message dictionaries, representing the conversation history. + sender: The agent object representing the sender of the message. + config: Configuration object, defaults to the current instance if not provided. + + Returns: + A tuple containing a boolean indicating if the conversation + should be terminated, and a human reply which can be a string, a dictionary, or None. + """ + iostream = IOStream.get_default() + + if config is None: + config = self + if messages is None: + messages = self._oai_messages[sender] if sender else [] + + termination_reason = None + + # if there are no messages, continue the conversation + if not messages: + return False, None + message = messages[-1] + + reply = "" + no_human_input_msg = "" + sender_name = "the sender" if sender is None else sender.name + if self.human_input_mode == "ALWAYS": + reply = self.get_human_input( + f"Replying as {self.name}. Provide feedback to {sender_name}. Press enter to skip and use auto-reply, or type 'exit' to end the conversation: " + ) + no_human_input_msg = "NO HUMAN INPUT RECEIVED." 
if not reply else "" + # if the human input is empty, and the message is a termination message, then we will terminate the conversation + if not reply and self._is_termination_msg(message): + termination_reason = f"Termination message condition on agent '{self.name}' met" + elif reply == "exit": + termination_reason = "User requested to end the conversation" + + reply = reply if reply or not self._is_termination_msg(message) else "exit" + else: + if self._consecutive_auto_reply_counter[sender] >= self._max_consecutive_auto_reply_dict[sender]: + if self.human_input_mode == "NEVER": + termination_reason = "Maximum number of consecutive auto-replies reached" + reply = "exit" + else: + # self.human_input_mode == "TERMINATE": + terminate = self._is_termination_msg(message) + reply = self.get_human_input( + f"Please give feedback to {sender_name}. Press enter or type 'exit' to stop the conversation: " + if terminate + else f"Please give feedback to {sender_name}. Press enter to skip and use auto-reply, or type 'exit' to stop the conversation: " + ) + no_human_input_msg = "NO HUMAN INPUT RECEIVED." if not reply else "" + # if the human input is empty, and the message is a termination message, then we will terminate the conversation + if reply != "exit" and terminate: + termination_reason = ( + f"Termination message condition on agent '{self.name}' met and no human input provided" + ) + elif reply == "exit": + termination_reason = "User requested to end the conversation" + + reply = reply if reply or not terminate else "exit" + elif self._is_termination_msg(message): + if self.human_input_mode == "NEVER": + termination_reason = f"Termination message condition on agent '{self.name}' met" + reply = "exit" + else: + # self.human_input_mode == "TERMINATE": + reply = self.get_human_input( + f"Please give feedback to {sender_name}. Press enter or type 'exit' to stop the conversation: " + ) + no_human_input_msg = "NO HUMAN INPUT RECEIVED." 
if not reply else "" + + # if the human input is empty, and the message is a termination message, then we will terminate the conversation + if not reply or reply == "exit": + termination_reason = ( + f"Termination message condition on agent '{self.name}' met and no human input provided" + ) + + reply = reply or "exit" + + # print the no_human_input_msg + if no_human_input_msg: + iostream.send( + TerminationAndHumanReplyNoInputEvent( + no_human_input_msg=no_human_input_msg, sender=sender, recipient=self + ) + ) + + # stop the conversation + if reply == "exit": + # reset the consecutive_auto_reply_counter + self._consecutive_auto_reply_counter[sender] = 0 + + if termination_reason: + iostream.send(TerminationEvent(termination_reason=termination_reason)) + + return True, None + + # send the human reply + if reply or self._max_consecutive_auto_reply_dict[sender] == 0: + # reset the consecutive_auto_reply_counter + self._consecutive_auto_reply_counter[sender] = 0 + # User provided a custom response, return function and tool failures indicating user interruption + tool_returns = [] + if message.get("function_call", False): + tool_returns.append({ + "role": "function", + "name": message["function_call"].get("name", ""), + "content": "USER INTERRUPTED", + }) + + if message.get("tool_calls", False): + tool_returns.extend([ + {"role": "tool", "tool_call_id": tool_call.get("id", ""), "content": "USER INTERRUPTED"} + for tool_call in message["tool_calls"] + ]) + + response = {"role": "user", "content": reply} + if tool_returns: + response["tool_responses"] = tool_returns + + return True, response + + # increment the consecutive_auto_reply_counter + self._consecutive_auto_reply_counter[sender] += 1 + if self.human_input_mode != "NEVER": + iostream.send(UsingAutoReplyEvent(human_input_mode=self.human_input_mode, sender=sender, recipient=self)) + + return False, None + + async def a_check_termination_and_human_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[Any] = None, + ) -> tuple[bool, Union[str, None]]: + """(async) Check if the conversation should be terminated, and if human reply is provided. + + This method checks for conditions that require the conversation to be terminated, such as reaching + a maximum number of consecutive auto-replies or encountering a termination message. Additionally, + it prompts for and processes human input based on the configured human input mode, which can be + 'ALWAYS', 'NEVER', or 'TERMINATE'. The method also manages the consecutive auto-reply counter + for the conversation and prints relevant messages based on the human input received. + + Args: + messages (Optional[List[Dict]]): A list of message dictionaries, representing the conversation history. + sender (Optional[Agent]): The agent object representing the sender of the message. + config (Optional[Any]): Configuration object, defaults to the current instance if not provided. + + Returns: + Tuple[bool, Union[str, Dict, None]]: A tuple containing a boolean indicating if the conversation + should be terminated, and a human reply which can be a string, a dictionary, or None. 
+ """ + iostream = IOStream.get_default() + + if config is None: + config = self + if messages is None: + messages = self._oai_messages[sender] if sender else [] + + termination_reason = None + + message = messages[-1] if messages else {} + reply = "" + no_human_input_msg = "" + sender_name = "the sender" if sender is None else sender.name + if self.human_input_mode == "ALWAYS": + reply = await self.a_get_human_input( + f"Replying as {self.name}. Provide feedback to {sender_name}. Press enter to skip and use auto-reply, or type 'exit' to end the conversation: " + ) + no_human_input_msg = "NO HUMAN INPUT RECEIVED." if not reply else "" + # if the human input is empty, and the message is a termination message, then we will terminate the conversation + if not reply and self._is_termination_msg(message): + termination_reason = f"Termination message condition on agent '{self.name}' met" + elif reply == "exit": + termination_reason = "User requested to end the conversation" + + reply = reply if reply or not self._is_termination_msg(message) else "exit" + else: + if self._consecutive_auto_reply_counter[sender] >= self._max_consecutive_auto_reply_dict[sender]: + if self.human_input_mode == "NEVER": + termination_reason = "Maximum number of consecutive auto-replies reached" + reply = "exit" + else: + # self.human_input_mode == "TERMINATE": + terminate = self._is_termination_msg(message) + reply = await self.a_get_human_input( + f"Please give feedback to {sender_name}. Press enter or type 'exit' to stop the conversation: " + if terminate + else f"Please give feedback to {sender_name}. Press enter to skip and use auto-reply, or type 'exit' to stop the conversation: " + ) + no_human_input_msg = "NO HUMAN INPUT RECEIVED." if not reply else "" + # if the human input is empty, and the message is a termination message, then we will terminate the conversation + if reply != "exit" and terminate: + termination_reason = ( + f"Termination message condition on agent '{self.name}' met and no human input provided" + ) + elif reply == "exit": + termination_reason = "User requested to end the conversation" + + reply = reply if reply or not terminate else "exit" + elif self._is_termination_msg(message): + if self.human_input_mode == "NEVER": + termination_reason = f"Termination message condition on agent '{self.name}' met" + reply = "exit" + else: + # self.human_input_mode == "TERMINATE": + reply = await self.a_get_human_input( + f"Please give feedback to {sender_name}. Press enter or type 'exit' to stop the conversation: " + ) + no_human_input_msg = "NO HUMAN INPUT RECEIVED." 
if not reply else "" + + # if the human input is empty, and the message is a termination message, then we will terminate the conversation + if not reply or reply == "exit": + termination_reason = ( + f"Termination message condition on agent '{self.name}' met and no human input provided" + ) + + reply = reply or "exit" + + # print the no_human_input_msg + if no_human_input_msg: + iostream.send( + TerminationAndHumanReplyNoInputEvent( + no_human_input_msg=no_human_input_msg, sender=sender, recipient=self + ) + ) + + # stop the conversation + if reply == "exit": + # reset the consecutive_auto_reply_counter + self._consecutive_auto_reply_counter[sender] = 0 + + if termination_reason: + iostream.send(TerminationEvent(termination_reason=termination_reason)) + + return True, None + + # send the human reply + if reply or self._max_consecutive_auto_reply_dict[sender] == 0: + # User provided a custom response, return function and tool results indicating user interruption + # reset the consecutive_auto_reply_counter + self._consecutive_auto_reply_counter[sender] = 0 + tool_returns = [] + if message.get("function_call", False): + tool_returns.append({ + "role": "function", + "name": message["function_call"].get("name", ""), + "content": "USER INTERRUPTED", + }) + + if message.get("tool_calls", False): + tool_returns.extend([ + {"role": "tool", "tool_call_id": tool_call.get("id", ""), "content": "USER INTERRUPTED"} + for tool_call in message["tool_calls"] + ]) + + response = {"role": "user", "content": reply} + if tool_returns: + response["tool_responses"] = tool_returns + + return True, response + + # increment the consecutive_auto_reply_counter + self._consecutive_auto_reply_counter[sender] += 1 + if self.human_input_mode != "NEVER": + iostream.send(UsingAutoReplyEvent(human_input_mode=self.human_input_mode, sender=sender, recipient=self)) + + return False, None + + def generate_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional["Agent"] = None, + **kwargs: Any, + ) -> Optional[Union[str, dict[str, Any]]]: + """Reply based on the conversation history and the sender. + + Either messages or sender must be provided. + Register a reply_func with `None` as one trigger for it to be activated when `messages` is non-empty and `sender` is `None`. + Use registered auto reply functions to generate replies. + By default, the following functions are checked in order: + 1. check_termination_and_human_reply + 2. generate_function_call_reply (deprecated in favor of tool_calls) + 3. generate_tool_calls_reply + 4. generate_code_execution_reply + 5. generate_oai_reply + Every function returns a tuple (final, reply). + When a function returns final=False, the next function will be checked. + So by default, termination and human reply will be checked first. + If not terminating and human reply is skipped, execute function or code and return the result. + AI replies are generated only when no code execution is performed. + + Args: + messages: a list of messages in the conversation history. + sender: sender of an Agent instance. + **kwargs (Any): Additional arguments to customize reply generation. Supported kwargs: + - exclude (List[Callable[..., Any]]): A list of reply functions to exclude from + the reply generation process. Functions in this list will be skipped even if + they would normally be triggered. + + Returns: + str or dict or None: reply. None if no reply is generated. 
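+
+        Example (a minimal sketch; `assistant` is a placeholder agent configured elsewhere):
+            ```python
+            reply = assistant.generate_reply(
+                messages=[{"role": "user", "content": "Summarize the plan in one sentence."}]
+            )
+            print(reply)
+            ```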
+ """ + if all((messages is None, sender is None)): + error_msg = f"Either {messages=} or {sender=} must be provided." + logger.error(error_msg) + raise AssertionError(error_msg) + + if messages is None: + messages = self._oai_messages[sender] + + # Call the hookable method that gives registered hooks a chance to update agent state, used for their context variables. + self.update_agent_state_before_reply(messages) + + # Call the hookable method that gives registered hooks a chance to process the last message. + # Message modifications do not affect the incoming messages or self._oai_messages. + messages = self.process_last_received_message(messages) + + # Call the hookable method that gives registered hooks a chance to process all messages. + # Message modifications do not affect the incoming messages or self._oai_messages. + messages = self.process_all_messages_before_reply(messages) + + for reply_func_tuple in self._reply_func_list: + reply_func = reply_func_tuple["reply_func"] + if "exclude" in kwargs and reply_func in kwargs["exclude"]: + continue + if inspect.iscoroutinefunction(reply_func): + continue + if self._match_trigger(reply_func_tuple["trigger"], sender): + final, reply = reply_func(self, messages=messages, sender=sender, config=reply_func_tuple["config"]) + if logging_enabled(): + log_event( + self, + "reply_func_executed", + reply_func_module=reply_func.__module__, + reply_func_name=reply_func.__name__, + final=final, + reply=reply, + ) + if final: + return reply + return self._default_auto_reply + + async def a_generate_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional["Agent"] = None, + **kwargs: Any, + ) -> Union[str, dict[str, Any], None]: + """(async) Reply based on the conversation history and the sender. + + Either messages or sender must be provided. + Register a reply_func with `None` as one trigger for it to be activated when `messages` is non-empty and `sender` is `None`. + Use registered auto reply functions to generate replies. + By default, the following functions are checked in order: + 1. check_termination_and_human_reply + 2. generate_function_call_reply + 3. generate_tool_calls_reply + 4. generate_code_execution_reply + 5. generate_oai_reply + Every function returns a tuple (final, reply). + When a function returns final=False, the next function will be checked. + So by default, termination and human reply will be checked first. + If not terminating and human reply is skipped, execute function or code and return the result. + AI replies are generated only when no code execution is performed. + + Args: + messages: a list of messages in the conversation history. + sender: sender of an Agent instance. + **kwargs (Any): Additional arguments to customize reply generation. Supported kwargs: + - exclude (List[Callable[..., Any]]): A list of reply functions to exclude from + the reply generation process. Functions in this list will be skipped even if + they would normally be triggered. + + Returns: + str or dict or None: reply. None if no reply is generated. + """ + if all((messages is None, sender is None)): + error_msg = f"Either {messages=} or {sender=} must be provided." + logger.error(error_msg) + raise AssertionError(error_msg) + + if messages is None: + messages = self._oai_messages[sender] + + # Call the hookable method that gives registered hooks a chance to update agent state, used for their context variables. 
+ self.update_agent_state_before_reply(messages) + + # Call the hookable method that gives registered hooks a chance to process the last message. + # Message modifications do not affect the incoming messages or self._oai_messages. + messages = self.process_last_received_message(messages) + + # Call the hookable method that gives registered hooks a chance to process all messages. + # Message modifications do not affect the incoming messages or self._oai_messages. + messages = self.process_all_messages_before_reply(messages) + + for reply_func_tuple in self._reply_func_list: + reply_func = reply_func_tuple["reply_func"] + if "exclude" in kwargs and reply_func in kwargs["exclude"]: + continue + + if self._match_trigger(reply_func_tuple["trigger"], sender): + if inspect.iscoroutinefunction(reply_func): + final, reply = await reply_func( + self, messages=messages, sender=sender, config=reply_func_tuple["config"] + ) + else: + final, reply = reply_func(self, messages=messages, sender=sender, config=reply_func_tuple["config"]) + if final: + return reply + return self._default_auto_reply + + def _match_trigger(self, trigger: Union[None, str, type, Agent, Callable, list], sender: Optional[Agent]) -> bool: + """Check if the sender matches the trigger. + + Args: + trigger (Union[None, str, type, Agent, Callable, List]): The condition to match against the sender. + Can be `None`, string, type, `Agent` instance, callable, or a list of these. + sender (Agent): The sender object or type to be matched against the trigger. + + Returns: + `True` if the sender matches the trigger, otherwise `False`. + + Raises: + ValueError: If the trigger type is unsupported. + """ + if trigger is None: + return sender is None + elif isinstance(trigger, str): + if sender is None: + raise SenderRequiredError() + return trigger == sender.name + elif isinstance(trigger, type): + return isinstance(sender, trigger) + elif isinstance(trigger, Agent): + # return True if the sender is the same type (class) as the trigger + return trigger == sender + elif isinstance(trigger, Callable): + rst = trigger(sender) + assert isinstance(rst, bool), f"trigger {trigger} must return a boolean value." + return rst + elif isinstance(trigger, list): + return any(self._match_trigger(t, sender) for t in trigger) + else: + raise ValueError(f"Unsupported trigger type: {type(trigger)}") + + def get_human_input(self, prompt: str) -> str: + """Get human input. + + Override this method to customize the way to get human input. + + Args: + prompt (str): prompt for the human input. + + Returns: + str: human input. + """ + iostream = IOStream.get_default() + + reply = iostream.input(prompt) + self._human_input.append(reply) + return reply + + async def a_get_human_input(self, prompt: str) -> str: + """(Async) Get human input. + + Override this method to customize the way to get human input. + + Args: + prompt (str): prompt for the human input. + + Returns: + str: human input. 
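+
+        Example (an illustrative override in a subclass; `AutoApproveAgent` is a hypothetical name):
+            ```python
+            class AutoApproveAgent(ConversableAgent):
+                async def a_get_human_input(self, prompt: str) -> str:
+                    # Never block on console input; always fall back to auto-reply.
+                    return ""
+            ```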
+ """ + iostream = IOStream.get_default() + + reply = await iostream.input(prompt) + self._human_input.append(reply) + return reply + + # def _get_human_input( + # self, iostream: IOStream, prompt: str, + # ) -> tuple[bool, Optional[Union[str, dict[str, Any]]]]: + # with IOStream.set_default(iostream): + # print("!"*100) + # print("Getting human input...") + # return self.get_human_input(prompt) + + # return await asyncio.get_event_loop().run_in_executor( + # None, + # functools.partial( + # _get_human_input, self=self, iostream=iostream, prompt=prompt, + # ), + # ) + + def run_code(self, code: str, **kwargs: Any) -> tuple[int, str, Optional[str]]: + """Run the code and return the result. + + Override this function to modify the way to run the code. + + Args: + code (str): the code to be executed. + **kwargs: other keyword arguments. + + Returns: + A tuple of (exitcode, logs, image). + exitcode (int): the exit code of the code execution. + logs (str): the logs of the code execution. + image (str or None): the docker image used for the code execution. + """ + return execute_code(code, **kwargs) + + def execute_code_blocks(self, code_blocks): + """Execute the code blocks and return the result.""" + iostream = IOStream.get_default() + + logs_all = "" + for i, code_block in enumerate(code_blocks): + lang, code = code_block + if not lang: + lang = infer_lang(code) + + iostream.send(ExecuteCodeBlockEvent(code=code, language=lang, code_block_count=i, recipient=self)) + + if lang in ["bash", "shell", "sh"]: + exitcode, logs, image = self.run_code(code, lang=lang, **self._code_execution_config) + elif lang in PYTHON_VARIANTS: + filename = code[11 : code.find("\n")].strip() if code.startswith("# filename: ") else None + exitcode, logs, image = self.run_code( + code, + lang="python", + filename=filename, + **self._code_execution_config, + ) + else: + # In case the language is not supported, we return an error message. + exitcode, logs, image = ( + 1, + f"unknown language {lang}", + None, + ) + # raise NotImplementedError + if image is not None: + self._code_execution_config["use_docker"] = image + logs_all += "\n" + logs + if exitcode != 0: + return exitcode, logs_all + return exitcode, logs_all + + @staticmethod + def _format_json_str(jstr): + """Remove newlines outside of quotes, and handle JSON escape sequences. + + 1. this function removes the newline in the query outside of quotes otherwise json.loads(s) will fail. + Ex 1: + "{\n"tool": "python",\n"query": "print('hello')\nprint('world')"\n}" -> "{"tool": "python","query": "print('hello')\nprint('world')"}" + Ex 2: + "{\n \"location\": \"Boston, MA\"\n}" -> "{"location": "Boston, MA"}" + + 2. this function also handles JSON escape sequences inside quotes. + Ex 1: + '{"args": "a\na\na\ta"}' -> '{"args": "a\\na\\na\\ta"}' + """ + result = [] + inside_quotes = False + last_char = " " + for char in jstr: + if last_char != "\\" and char == '"': + inside_quotes = not inside_quotes + last_char = char + if not inside_quotes and char == "\n": + continue + if inside_quotes and char == "\n": + char = "\\n" + if inside_quotes and char == "\t": + char = "\\t" + result.append(char) + return "".join(result) + + def execute_function( + self, func_call: dict[str, Any], call_id: Optional[str] = None, verbose: bool = False + ) -> tuple[bool, dict[str, Any]]: + """Execute a function call and return the result. + + Override this function to modify the way to execute function and tool calls. 
+ + Args: + func_call: a dictionary extracted from openai message at "function_call" or "tool_calls" with keys "name" and "arguments". + call_id: a string to identify the tool call. + verbose (bool): Whether to send messages about the execution details to the + output stream. When True, both the function call arguments and the execution + result will be displayed. Defaults to False. + + + Returns: + A tuple of (is_exec_success, result_dict). + is_exec_success (boolean): whether the execution is successful. + result_dict: a dictionary with keys "name", "role", and "content". Value of "role" is "function". + + "function_call" deprecated as of [OpenAI API v1.1.0](https://github.com/openai/openai-python/releases/tag/v1.1.0) + See https://platform.openai.com/docs/api-reference/chat/create#chat-create-function_call + """ + iostream = IOStream.get_default() + + func_name = func_call.get("name", "") + func = self._function_map.get(func_name, None) + + is_exec_success = False + if func is not None: + # Extract arguments from a json-like string and put it into a dict. + input_string = self._format_json_str(func_call.get("arguments", "{}")) + try: + arguments = json.loads(input_string) + except json.JSONDecodeError as e: + arguments = None + content = f"Error: {e}\n The argument must be in JSON format." + + # Try to execute the function + if arguments is not None: + iostream.send( + ExecuteFunctionEvent(func_name=func_name, call_id=call_id, arguments=arguments, recipient=self) + ) + try: + content = func(**arguments) + is_exec_success = True + except Exception as e: + content = f"Error: {e}" + else: + arguments = {} + content = f"Error: Function {func_name} not found." + + iostream.send( + ExecutedFunctionEvent( + func_name=func_name, + call_id=call_id, + arguments=arguments, + content=content, + recipient=self, + is_exec_success=is_exec_success, + ) + ) + + return is_exec_success, { + "name": func_name, + "role": "function", + "content": content, + } + + async def a_execute_function( + self, func_call: dict[str, Any], call_id: Optional[str] = None, verbose: bool = False + ) -> tuple[bool, dict[str, Any]]: + """Execute an async function call and return the result. + + Override this function to modify the way async functions and tools are executed. + + Args: + func_call: a dictionary extracted from openai message at key "function_call" or "tool_calls" with keys "name" and "arguments". + call_id: a string to identify the tool call. + verbose (bool): Whether to send messages about the execution details to the + output stream. When True, both the function call arguments and the execution + result will be displayed. Defaults to False. + + Returns: + A tuple of (is_exec_success, result_dict). + is_exec_success (boolean): whether the execution is successful. + result_dict: a dictionary with keys "name", "role", and "content". Value of "role" is "function". + + "function_call" deprecated as of [OpenAI API v1.1.0](https://github.com/openai/openai-python/releases/tag/v1.1.0) + See https://platform.openai.com/docs/api-reference/chat/create#chat-create-function_call + """ + iostream = IOStream.get_default() + + func_name = func_call.get("name", "") + func = self._function_map.get(func_name, None) + + is_exec_success = False + if func is not None: + # Extract arguments from a json-like string and put it into a dict. 
+ input_string = self._format_json_str(func_call.get("arguments", "{}")) + try: + arguments = json.loads(input_string) + except json.JSONDecodeError as e: + arguments = None + content = f"Error: {e}\n The argument must be in JSON format." + + # Try to execute the function + if arguments is not None: + iostream.send( + ExecuteFunctionEvent(func_name=func_name, call_id=call_id, arguments=arguments, recipient=self) + ) + try: + if inspect.iscoroutinefunction(func): + content = await func(**arguments) + else: + # Fallback to sync function if the function is not async + content = func(**arguments) + is_exec_success = True + except Exception as e: + content = f"Error: {e}" + else: + arguments = {} + content = f"Error: Function {func_name} not found." + + iostream.send( + ExecutedFunctionEvent( + func_name=func_name, + call_id=call_id, + arguments=arguments, + content=content, + recipient=self, + is_exec_success=is_exec_success, + ) + ) + + return is_exec_success, { + "name": func_name, + "role": "function", + "content": content, + } + + def generate_init_message( + self, message: Optional[Union[dict[str, Any], str]], **kwargs: Any + ) -> Union[str, dict[str, Any]]: + """Generate the initial message for the agent. + If message is None, input() will be called to get the initial message. + + Args: + message (str or None): the message to be processed. + **kwargs: any additional information. It has the following reserved fields: + "carryover": a string or a list of string to specify the carryover information to be passed to this chat. It can be a string or a list of string. + If provided, we will combine this carryover with the "message" content when generating the initial chat + message. + + Returns: + str or dict: the processed message. + """ + if message is None: + message = self.get_human_input(">") + + return self._handle_carryover(message, kwargs) + + def _handle_carryover(self, message: Union[str, dict[str, Any]], kwargs: dict) -> Union[str, dict[str, Any]]: + if not kwargs.get("carryover"): + return message + + if isinstance(message, str): + return self._process_carryover(message, kwargs) + + elif isinstance(message, dict): + if isinstance(message.get("content"), str): + # Makes sure the original message is not mutated + message = message.copy() + message["content"] = self._process_carryover(message["content"], kwargs) + elif isinstance(message.get("content"), list): + # Makes sure the original message is not mutated + message = message.copy() + message["content"] = self._process_multimodal_carryover(message["content"], kwargs) + else: + raise InvalidCarryOverTypeError("Carryover should be a string or a list of strings.") + + return message + + def _process_carryover(self, content: str, kwargs: dict) -> str: + # Makes sure there's a carryover + if not kwargs.get("carryover"): + return content + + # if carryover is string + if isinstance(kwargs["carryover"], str): + content += "\nContext: \n" + kwargs["carryover"] + elif isinstance(kwargs["carryover"], list): + content += "\nContext: \n" + ("\n").join([_post_process_carryover_item(t) for t in kwargs["carryover"]]) + else: + raise InvalidCarryOverTypeError( + "Carryover should be a string or a list of strings. Not adding carryover to the message." 
+            )
+        return content
+
+    def _process_multimodal_carryover(self, content: list[dict[str, Any]], kwargs: dict) -> list[dict[str, Any]]:
+        """Prepends the context to a multimodal message."""
+        # Makes sure there's a carryover
+        if not kwargs.get("carryover"):
+            return content
+
+        return [{"type": "text", "text": self._process_carryover("", kwargs)}] + content
+
+    async def a_generate_init_message(
+        self, message: Optional[Union[dict[str, Any], str]], **kwargs: Any
+    ) -> Union[str, dict[str, Any]]:
+        """Generate the initial message for the agent.
+        If message is None, input() will be called to get the initial message.
+
+        Args:
+            message (str or None): the message to be processed.
+            **kwargs: any additional information. It has the following reserved fields:
+                "carryover": a string or a list of strings specifying the carryover information to be passed to this chat.
+                    If provided, we will combine this carryover with the "message" content when generating the initial chat
+                    message.
+
+        Returns:
+            str or dict: the processed message.
+        """
+        if message is None:
+            message = await self.a_get_human_input(">")
+
+        return self._handle_carryover(message, kwargs)
+
+    @property
+    def tools(self) -> list[Tool]:
+        """Get the agent's tools (registered for LLM).
+
+        Note this is a copy of the tools list; use add_tool and remove_tool to modify the tools list.
+        """
+        return self._tools.copy()
+
+    def remove_tool_for_llm(self, tool: Tool) -> None:
+        """Remove a tool (registered for LLM)."""
+        try:
+            self._register_for_llm(tool=tool, api_style="tool", is_remove=True)
+            self._tools.remove(tool)
+        except ValueError:
+            raise ValueError(f"Tool {tool} not found in collection")
+
+    def register_function(self, function_map: dict[str, Optional[Callable[..., Any]]], silent_override: bool = False):
+        """Register functions to the agent.
+
+        Args:
+            function_map: a dictionary mapping function names to functions. If function_map[name] is None, the function will be removed from the function_map.
+            silent_override: whether to suppress warnings when overriding existing functions.
+        """
+        for name, func in function_map.items():
+            self._assert_valid_name(name)
+            if func is None and name not in self._function_map:
+                warnings.warn(f"The function {name} to remove doesn't exist", UserWarning)
+            if not silent_override and name in self._function_map:
+                warnings.warn(f"Function '{name}' is being overridden.", UserWarning)
+        self._function_map.update(function_map)
+        self._function_map = {k: v for k, v in self._function_map.items() if v is not None}
+
+    def update_function_signature(
+        self, func_sig: Union[str, dict[str, Any]], is_remove: bool, silent_override: bool = False
+    ):
+        """Update a function_signature in the LLM configuration for function_call.
+
+        Args:
+            func_sig (str or dict): description/name of the function to update/remove to the model. See: https://platform.openai.com/docs/api-reference/chat/create#chat/create-functions
+            is_remove: whether to remove the function named 'func_sig' from llm_config
+            silent_override: whether to suppress warnings when overriding existing functions.
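+
+        Example (illustrative sketch; `agent` and the `get_weather` schema are placeholders, and the agent is
+        assumed to have been constructed with an `llm_config`):
+            ```
+            weather_schema = {
+                "name": "get_weather",
+                "description": "Look up the current weather for a city.",
+                "parameters": {
+                    "type": "object",
+                    "properties": {"city": {"type": "string"}},
+                    "required": ["city"],
+                },
+            }
+            # Add (or override) the signature in llm_config["functions"]
+            agent.update_function_signature(weather_schema, is_remove=False)
+
+            # Remove it again by name
+            agent.update_function_signature("get_weather", is_remove=True)
+            ```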
+ + Deprecated as of [OpenAI API v1.1.0](https://github.com/openai/openai-python/releases/tag/v1.1.0) + See https://platform.openai.com/docs/api-reference/chat/create#chat-create-function_call + """ + if not isinstance(self.llm_config, (dict, LLMConfig)): + error_msg = "To update a function signature, agent must have an llm_config" + logger.error(error_msg) + raise AssertionError(error_msg) + + if is_remove: + if "functions" not in self.llm_config or len(self.llm_config["functions"]) == 0: + error_msg = f"The agent config doesn't have function {func_sig}." + logger.error(error_msg) + raise AssertionError(error_msg) + else: + self.llm_config["functions"] = [ + func for func in self.llm_config["functions"] if func["name"] != func_sig + ] + else: + if not isinstance(func_sig, dict): + raise ValueError( + f"The function signature must be of the type dict. Received function signature type {type(func_sig)}" + ) + if "name" not in func_sig: + raise ValueError(f"The function signature must have a 'name' key. Received: {func_sig}") + self._assert_valid_name(func_sig["name"]), func_sig + if "functions" in self.llm_config: + if not silent_override and any( + func["name"] == func_sig["name"] for func in self.llm_config["functions"] + ): + warnings.warn(f"Function '{func_sig['name']}' is being overridden.", UserWarning) + + self.llm_config["functions"] = [ + func for func in self.llm_config["functions"] if func.get("name") != func_sig["name"] + ] + [func_sig] + else: + self.llm_config["functions"] = [func_sig] + + # Do this only if llm_config is a dict. If llm_config is LLMConfig, LLMConfig will handle this. + if len(self.llm_config["functions"]) == 0 and isinstance(self.llm_config, dict): + del self.llm_config["functions"] + + self.client = OpenAIWrapper(**self.llm_config) + + def update_tool_signature( + self, tool_sig: Union[str, dict[str, Any]], is_remove: bool, silent_override: bool = False + ): + """Update a tool_signature in the LLM configuration for tool_call. + + Args: + tool_sig (str or dict): description/name of the tool to update/remove to the model. See: https://platform.openai.com/docs/api-reference/chat/create#chat-create-tools + is_remove: whether removing the tool from llm_config with name 'tool_sig' + silent_override: whether to print warnings when overriding functions. + """ + if not self.llm_config: + error_msg = "To update a tool signature, agent must have an llm_config" + logger.error(error_msg) + raise AssertionError(error_msg) + + if is_remove: + if "tools" not in self.llm_config or len(self.llm_config["tools"]) == 0: + error_msg = f"The agent config doesn't have tool {tool_sig}." + logger.error(error_msg) + raise AssertionError(error_msg) + else: + current_tools = self.llm_config["tools"] + filtered_tools = [] + + # Loop through and rebuild tools list without the tool to remove + for tool in current_tools: + tool_name = tool["function"]["name"] + + # Match by tool name, or by tool signature + is_different = tool_name != tool_sig if isinstance(tool_sig, str) else tool != tool_sig + + if is_different: + filtered_tools.append(tool) + + self.llm_config["tools"] = filtered_tools + else: + if not isinstance(tool_sig, dict): + raise ValueError( + f"The tool signature must be of the type dict. 
Received tool signature type {type(tool_sig)}" + ) + self._assert_valid_name(tool_sig["function"]["name"]) + if "tools" in self.llm_config and len(self.llm_config["tools"]) > 0: + if not silent_override and any( + tool["function"]["name"] == tool_sig["function"]["name"] for tool in self.llm_config["tools"] + ): + warnings.warn(f"Function '{tool_sig['function']['name']}' is being overridden.", UserWarning) + self.llm_config["tools"] = [ + tool + for tool in self.llm_config["tools"] + if tool.get("function", {}).get("name") != tool_sig["function"]["name"] + ] + [tool_sig] + else: + self.llm_config["tools"] = [tool_sig] + + # Do this only if llm_config is a dict. If llm_config is LLMConfig, LLMConfig will handle this. + if len(self.llm_config["tools"]) == 0 and isinstance(self.llm_config, dict): + del self.llm_config["tools"] + + self.client = OpenAIWrapper(**self.llm_config) + + def can_execute_function(self, name: Union[list[str], str]) -> bool: + """Whether the agent can execute the function.""" + names = name if isinstance(name, list) else [name] + return all([n in self._function_map for n in names]) + + @property + def function_map(self) -> dict[str, Callable[..., Any]]: + """Return the function map.""" + return self._function_map + + def _wrap_function(self, func: F, inject_params: dict[str, Any] = {}, *, serialize: bool = True) -> F: + """Wrap the function inject chat context parameters and to dump the return value to json. + + Handles both sync and async functions. + + Args: + func: the function to be wrapped. + inject_params: the chat context parameters which will be passed to the function. + serialize: whether to serialize the return value + + Returns: + The wrapped function. + """ + + @load_basemodels_if_needed + @functools.wraps(func) + def _wrapped_func(*args, **kwargs): + retval = func(*args, **kwargs, **inject_params) + if logging_enabled(): + log_function_use(self, func, kwargs, retval) + return serialize_to_str(retval) if serialize else retval + + @load_basemodels_if_needed + @functools.wraps(func) + async def _a_wrapped_func(*args, **kwargs): + retval = await func(*args, **kwargs, **inject_params) + if logging_enabled(): + log_function_use(self, func, kwargs, retval) + return serialize_to_str(retval) if serialize else retval + + wrapped_func = _a_wrapped_func if inspect.iscoroutinefunction(func) else _wrapped_func + + # needed for testing + wrapped_func._origin = func + + return wrapped_func + + @staticmethod + def _create_tool_if_needed( + func_or_tool: Union[F, Tool], + name: Optional[str], + description: Optional[str], + ) -> Tool: + if isinstance(func_or_tool, Tool): + tool: Tool = func_or_tool + # create new tool object if name or description is not None + if name or description: + tool = Tool(func_or_tool=tool, name=name, description=description) + elif inspect.isfunction(func_or_tool): + function: Callable[..., Any] = func_or_tool + tool = Tool(func_or_tool=function, name=name, description=description) + else: + raise TypeError(f"'func_or_tool' must be a function or a Tool object, got '{type(func_or_tool)}' instead.") + return tool + + def register_for_llm( + self, + *, + name: Optional[str] = None, + description: Optional[str] = None, + api_style: Literal["function", "tool"] = "tool", + silent_override: bool = False, + ) -> Callable[[Union[F, Tool]], Tool]: + """Decorator factory for registering a function to be used by an agent. + + It's return value is used to decorate a function to be registered to the agent. 
The function uses type hints to + specify the arguments and return type. The function name is used as the default name for the function, + but a custom name can be provided. The function description is used to describe the function in the + agent's configuration. + + Args: + name (optional(str)): name of the function. If None, the function name will be used (default: None). + description (optional(str)): description of the function (default: None). It is mandatory + for the initial decorator, but the following ones can omit it. + api_style: (literal): the API style for function call. + For Azure OpenAI API, use version 2023-12-01-preview or later. + `"function"` style will be deprecated. For earlier version use + `"function"` if `"tool"` doesn't work. + See [Azure OpenAI documentation](https://learn.microsoft.com/en-us/azure/ai-services/openai/how-to/function-calling?tabs=python) for details. + silent_override (bool): whether to suppress any override warning messages. + + Returns: + The decorator for registering a function to be used by an agent. + + Examples: + ``` + @user_proxy.register_for_execution() + @agent2.register_for_llm() + @agent1.register_for_llm(description="This is a very useful function") + def my_function(a: Annotated[str, "description of a parameter"] = "a", b: int, c=3.14) -> str: + return a + str(b * c) + ``` + + For Azure OpenAI versions prior to 2023-12-01-preview, set `api_style` + to `"function"` if `"tool"` doesn't work: + ``` + @agent2.register_for_llm(api_style="function") + def my_function(a: Annotated[str, "description of a parameter"] = "a", b: int, c=3.14) -> str: + return a + str(b * c) + ``` + + """ + + def _decorator( + func_or_tool: Union[F, Tool], name: Optional[str] = name, description: Optional[str] = description + ) -> Tool: + """Decorator for registering a function to be used by an agent. + + Args: + func_or_tool: The function or the tool to be registered. + name: The name of the function or the tool. + description: The description of the function or the tool. + + Returns: + The function to be registered, with the _description attribute set to the function description. + + Raises: + ValueError: if the function description is not provided and not propagated by a previous decorator. + RuntimeError: if the LLM config is not set up before registering a function. + + """ + tool = self._create_tool_if_needed(func_or_tool, name, description) + + self._register_for_llm(tool, api_style, silent_override=silent_override) + if tool not in self._tools: + self._tools.append(tool) + + return tool + + return _decorator + + def _register_for_llm( + self, tool: Tool, api_style: Literal["tool", "function"], is_remove: bool = False, silent_override: bool = False + ) -> None: + """ + Register a tool for LLM. + + Args: + tool: the tool to be registered. + api_style: the API style for function call ("tool" or "function"). + is_remove: whether to remove the function or tool. + silent_override: whether to suppress any override warning messages. 
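+
+        Example (illustrative; `my_tool` stands for any `Tool` instance and the agent is assumed to have an
+        `llm_config`):
+            ```
+            # Advertise the tool's schema to the LLM ...
+            agent._register_for_llm(my_tool, api_style="tool")
+            # ... and later withdraw it again
+            agent._register_for_llm(my_tool, api_style="tool", is_remove=True)
+            ```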
+ + Returns: + None + """ + # register the function to the agent if there is LLM config, raise an exception otherwise + if self.llm_config is None: + raise RuntimeError("LLM config must be setup before registering a function for LLM.") + + if api_style == "function": + self.update_function_signature(tool.function_schema, is_remove=is_remove, silent_override=silent_override) + elif api_style == "tool": + self.update_tool_signature(tool.tool_schema, is_remove=is_remove, silent_override=silent_override) + else: + raise ValueError(f"Unsupported API style: {api_style}") + + def set_ui_tools(self, tools: list[Tool]) -> None: + """Set the UI tools for the agent. + + Args: + tools: a list of tools to be set. + """ + # Unset the previous UI tools + self._unset_previous_ui_tools() + + # Set the new UI tools + for tool in tools: + # Register the tool for LLM + self._register_for_llm(tool, api_style="tool", silent_override=True) + if tool not in self._tools: + self._tools.append(tool) + + # Register for execution + self.register_for_execution(serialize=False, silent_override=True)(tool) + + # Set the current UI tools + self._ui_tools = tools + + def unset_ui_tools(self, tools: list[Tool]) -> None: + """Unset the UI tools for the agent. + + Args: + tools: a list of tools to be unset. + """ + for tool in tools: + self.remove_tool_for_llm(tool) + + def _unset_previous_ui_tools(self) -> None: + """Unset the previous UI tools for the agent. + + This is used to remove UI tools that were previously registered for LLM. + """ + self.unset_ui_tools(self._ui_tools) + for tool in self._ui_tools: + if tool in self._tools: + self._tools.remove(tool) + + # Unregister the function from the function map + if tool.name in self._function_map: + del self._function_map[tool.name] + + self._ui_tools = [] + + def register_for_execution( + self, + name: Optional[str] = None, + description: Optional[str] = None, + *, + serialize: bool = True, + silent_override: bool = False, + ) -> Callable[[Union[Tool, F]], Tool]: + """Decorator factory for registering a function to be executed by an agent. + + It's return value is used to decorate a function to be registered to the agent. + + Args: + name: name of the function. If None, the function name will be used (default: None). + description: description of the function (default: None). + serialize: whether to serialize the return value + silent_override: whether to suppress any override warning messages + + Returns: + The decorator for registering a function to be used by an agent. + + Examples: + ``` + @user_proxy.register_for_execution() + @agent2.register_for_llm() + @agent1.register_for_llm(description="This is a very useful function") + def my_function(a: Annotated[str, "description of a parameter"] = "a", b: int, c=3.14): + return a + str(b * c) + ``` + + """ + + def _decorator( + func_or_tool: Union[Tool, F], name: Optional[str] = name, description: Optional[str] = description + ) -> Tool: + """Decorator for registering a function to be used by an agent. + + Args: + func_or_tool: the function or the tool to be registered. + name: the name of the function. + description: the description of the function. + + Returns: + The tool to be registered. 
+ + """ + + tool = self._create_tool_if_needed(func_or_tool, name, description) + chat_context = ChatContext(self) + chat_context_params = {param: chat_context for param in tool._chat_context_param_names} + + self.register_function( + {tool.name: self._wrap_function(tool.func, chat_context_params, serialize=serialize)}, + silent_override=silent_override, + ) + + return tool + + return _decorator + + def register_model_client(self, model_client_cls: ModelClient, **kwargs: Any): + """Register a model client. + + Args: + model_client_cls: A custom client class that follows the Client interface + **kwargs: The kwargs for the custom client class to be initialized with + """ + self.client.register_model_client(model_client_cls, **kwargs) + + def register_hook(self, hookable_method: str, hook: Callable): + """Registers a hook to be called by a hookable method, in order to add a capability to the agent. + Registered hooks are kept in lists (one per hookable method), and are called in their order of registration. + + Args: + hookable_method: A hookable method name implemented by ConversableAgent. + hook: A method implemented by a subclass of AgentCapability. + """ + assert hookable_method in self.hook_lists, f"{hookable_method} is not a hookable method." + hook_list = self.hook_lists[hookable_method] + assert hook not in hook_list, f"{hook} is already registered as a hook." + hook_list.append(hook) + + def update_agent_state_before_reply(self, messages: list[dict[str, Any]]) -> None: + """Calls any registered capability hooks to update the agent's state. + Primarily used to update context variables. + Will, potentially, modify the messages. + """ + hook_list = self.hook_lists["update_agent_state"] + + # Call each hook (in order of registration) to process the messages. + for hook in hook_list: + hook(self, messages) + + def process_all_messages_before_reply(self, messages: list[dict[str, Any]]) -> list[dict[str, Any]]: + """Calls any registered capability hooks to process all messages, potentially modifying the messages.""" + hook_list = self.hook_lists["process_all_messages_before_reply"] + # If no hooks are registered, or if there are no messages to process, return the original message list. + if len(hook_list) == 0 or messages is None: + return messages + + # Call each hook (in order of registration) to process the messages. + processed_messages = messages + for hook in hook_list: + processed_messages = hook(processed_messages) + return processed_messages + + def process_last_received_message(self, messages: list[dict[str, Any]]) -> list[dict[str, Any]]: + """Calls any registered capability hooks to use and potentially modify the text of the last message, + as long as the last message is not a function call or exit command. + """ + # If any required condition is not met, return the original message list. + hook_list = self.hook_lists["process_last_received_message"] + if len(hook_list) == 0: + return messages # No hooks registered. + if messages is None: + return None # No message to process. + if len(messages) == 0: + return messages # No message to process. + last_message = messages[-1] + if "function_call" in last_message: + return messages # Last message is a function call. + if "context" in last_message: + return messages # Last message contains a context key. + if "content" not in last_message: + return messages # Last message has no content. 
+ + user_content = last_message["content"] + if not isinstance(user_content, str) and not isinstance(user_content, list): + # if the user_content is a string, it is for regular LLM + # if the user_content is a list, it should follow the multimodal LMM format. + return messages + if user_content == "exit": + return messages # Last message is an exit command. + + # Call each hook (in order of registration) to process the user's message. + processed_user_content = user_content + for hook in hook_list: + processed_user_content = hook(processed_user_content) + + if processed_user_content == user_content: + return messages # No hooks actually modified the user's message. + + # Replace the last user message with the expanded one. + messages = messages.copy() + messages[-1]["content"] = processed_user_content + return messages + + def print_usage_summary(self, mode: Union[str, list[str]] = ["actual", "total"]) -> None: + """Print the usage summary.""" + iostream = IOStream.get_default() + if self.client is None: + iostream.send(ConversableAgentUsageSummaryNoCostIncurredEvent(recipient=self)) + else: + iostream.send(ConversableAgentUsageSummaryEvent(recipient=self)) + + if self.client is not None: + self.client.print_usage_summary(mode) + + def get_actual_usage(self) -> Union[None, dict[str, int]]: + """Get the actual usage summary.""" + if self.client is None: + return None + else: + return self.client.actual_usage_summary + + def get_total_usage(self) -> Union[None, dict[str, int]]: + """Get the total usage summary.""" + if self.client is None: + return None + else: + return self.client.total_usage_summary + + @contextmanager + def _create_or_get_executor( + self, + executor_kwargs: Optional[dict[str, Any]] = None, + tools: Optional[Union[Tool, Iterable[Tool]]] = None, + agent_name: str = "executor", + agent_human_input_mode: str = "NEVER", + ) -> Generator["ConversableAgent", None, None]: + """Creates a user proxy / tool executor agent. + + Note: Code execution is not enabled by default. Pass the code execution config into executor_kwargs, if needed. + + Args: + executor_kwargs: agent's arguments. + tools: tools to register for execution with the agent. + agent_name: agent's name, defaults to 'executor'. + agent_human_input_mode: agent's human input mode, defaults to 'NEVER'. + """ + if executor_kwargs is None: + executor_kwargs = {} + if "is_termination_msg" not in executor_kwargs: + executor_kwargs["is_termination_msg"] = lambda x: (x["content"] is not None) and "TERMINATE" in x["content"] + + try: + if not self.run_executor: + self.run_executor = ConversableAgent( + name=agent_name, + human_input_mode=agent_human_input_mode, + **executor_kwargs, + ) + + tools = [] if tools is None else tools + tools = [tools] if isinstance(tools, Tool) else tools + for tool in tools: + tool.register_for_execution(self.run_executor) + tool.register_for_llm(self) + yield self.run_executor + finally: + if tools is not None: + for tool in tools: + self.update_tool_signature(tool_sig=tool.tool_schema["function"]["name"], is_remove=True) + + def _deprecated_run( + self, + message: str, + *, + tools: Optional[Union[Tool, Iterable[Tool]]] = None, + executor_kwargs: Optional[dict[str, Any]] = None, + max_turns: Optional[int] = None, + msg_to: Literal["agent", "user"] = "agent", + clear_history: bool = False, + user_input: bool = True, + summary_method: Optional[Union[str, Callable[..., Any]]] = DEFAULT_SUMMARY_METHOD, + ) -> ChatResult: + """Run a chat with the agent using the given message. 
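+
+        Example (illustrative sketch; the message text and keyword values are arbitrary):
+            ```
+            result = agent._deprecated_run(
+                "Plot the first ten Fibonacci numbers",
+                max_turns=3,
+                user_input=False,
+            )
+            ```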
+
+        A second agent will be created to represent the user; it will be known by the name 'user'. This agent does not have code execution enabled by default; if needed, pass the code execution config in with the executor_kwargs parameter.
+
+        The user can terminate the conversation when prompted or, if the agent's reply contains 'TERMINATE', it will terminate.
+
+        Args:
+            message: the message to be processed.
+            tools: the tools to be used by the agent.
+            executor_kwargs: the keyword arguments for the executor.
+            max_turns: maximum number of turns (a turn is equivalent to both agents having replied), defaults to None, which means unlimited. The original message is included.
+            msg_to: which agent is receiving the message and will be the first to reply, defaults to the agent.
+            clear_history: whether to clear the chat history.
+            user_input: the user will be asked for input at their turn.
+            summary_method: the method to summarize the chat.
+        """
+        with self._create_or_get_executor(
+            executor_kwargs=executor_kwargs,
+            tools=tools,
+            agent_name="user",
+            agent_human_input_mode="ALWAYS" if user_input else "NEVER",
+        ) as executor:
+            if msg_to == "agent":
+                return executor.initiate_chat(
+                    self,
+                    message=message,
+                    clear_history=clear_history,
+                    max_turns=max_turns,
+                    summary_method=summary_method,
+                )
+            else:
+                return self.initiate_chat(
+                    executor,
+                    message=message,
+                    clear_history=clear_history,
+                    max_turns=max_turns,
+                    summary_method=summary_method,
+                )
+
+    async def _deprecated_a_run(
+        self,
+        message: str,
+        *,
+        tools: Optional[Union[Tool, Iterable[Tool]]] = None,
+        executor_kwargs: Optional[dict[str, Any]] = None,
+        max_turns: Optional[int] = None,
+        msg_to: Literal["agent", "user"] = "agent",
+        clear_history: bool = False,
+        user_input: bool = True,
+        summary_method: Optional[Union[str, Callable[..., Any]]] = DEFAULT_SUMMARY_METHOD,
+    ) -> ChatResult:
+        """Run a chat asynchronously with the agent using the given message.
+
+        A second agent will be created to represent the user; it will be known by the name 'user'.
+
+        The user can terminate the conversation when prompted or, if the agent's reply contains 'TERMINATE', it will terminate.
+
+        Args:
+            message: the message to be processed.
+            tools: the tools to be used by the agent.
+            executor_kwargs: the keyword arguments for the executor.
+            max_turns: maximum number of turns (a turn is equivalent to both agents having replied), defaults to None, which means unlimited. The original message is included.
+            msg_to: which agent is receiving the message and will be the first to reply, defaults to the agent.
+            clear_history: whether to clear the chat history.
+            user_input: the user will be asked for input at their turn.
+            summary_method: the method to summarize the chat.
+        """
+        with self._create_or_get_executor(
+            executor_kwargs=executor_kwargs,
+            tools=tools,
+            agent_name="user",
+            agent_human_input_mode="ALWAYS" if user_input else "NEVER",
+        ) as executor:
+            if msg_to == "agent":
+                return await executor.a_initiate_chat(
+                    self,
+                    message=message,
+                    clear_history=clear_history,
+                    max_turns=max_turns,
+                    summary_method=summary_method,
+                )
+            else:
+                return await self.a_initiate_chat(
+                    executor,
+                    message=message,
+                    clear_history=clear_history,
+                    max_turns=max_turns,
+                    summary_method=summary_method,
+                )
+
+    def register_handoff(self, condition: Union["OnContextCondition", "OnCondition"]) -> None:
+        """
+        Register a single handoff condition (OnContextCondition or OnCondition).
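+
+        Example (illustrative sketch; `triage_agent` and the `needs_review` context variable are assumptions,
+        and the target/condition classes are used with the keyword fields they expose in this package):
+            ```
+            agent.register_handoff(
+                OnContextCondition(
+                    target=AgentTarget(triage_agent),
+                    condition=StringContextCondition(variable_name="needs_review"),
+                )
+            )
+            ```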
+ + Args: + condition: The condition to add (OnContextCondition, OnCondition) + """ + self.handoffs.add(condition) + + def register_handoffs(self, conditions: list[Union["OnContextCondition", "OnCondition"]]) -> None: + """ + Register multiple handoff conditions (OnContextCondition or OnCondition). + + Args: + conditions: List of conditions to add + """ + self.handoffs.add_many(conditions) + + +@export_module("autogen") +def register_function( + f: Callable[..., Any], + *, + caller: ConversableAgent, + executor: ConversableAgent, + name: Optional[str] = None, + description: str, +) -> None: + """Register a function to be proposed by an agent and executed for an executor. + + This function can be used instead of function decorators `@ConversationAgent.register_for_llm` and + `@ConversationAgent.register_for_execution`. + + Args: + f: the function to be registered. + caller: the agent calling the function, typically an instance of ConversableAgent. + executor: the agent executing the function, typically an instance of UserProxy. + name: name of the function. If None, the function name will be used (default: None). + description: description of the function. The description is used by LLM to decode whether the function + is called. Make sure the description is properly describing what the function does or it might not be + called by LLM when needed. + + """ + f = caller.register_for_llm(name=name, description=description)(f) + executor.register_for_execution(name=name)(f) diff --git a/mm_agents/coact/autogen/agentchat/group/__init__.py b/mm_agents/coact/autogen/agentchat/group/__init__.py new file mode 100644 index 0000000..4b95a59 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/__init__.py @@ -0,0 +1,64 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +__all__: list[str] = [] + +from .available_condition import ExpressionAvailableCondition, StringAvailableCondition +from .context_condition import ExpressionContextCondition, StringContextCondition +from .context_expression import ContextExpression +from .context_str import ContextStr +from .context_variables import ContextVariables +from .handoffs import Handoffs +from .llm_condition import ContextStrLLMCondition, StringLLMCondition +from .on_condition import OnCondition +from .on_context_condition import OnContextCondition +from .reply_result import ReplyResult +from .speaker_selection_result import SpeakerSelectionResult +from .targets.group_chat_target import GroupChatConfig, GroupChatTarget + +""" +from .targets.group_manager_target import ( + GroupManagerSelectionMessageContextStr, + GroupManagerSelectionMessageString, + GroupManagerTarget, +) +""" +from .targets.transition_target import ( + AgentNameTarget, + AgentTarget, + AskUserTarget, + NestedChatTarget, + RevertToUserTarget, + StayTarget, + TerminateTarget, +) + +__all__ = [ + "AgentNameTarget", + "AgentTarget", + "AskUserTarget", + "ContextExpression", + "ContextStr", + "ContextStrLLMCondition", + "ContextVariables", + "ExpressionAvailableCondition", + "ExpressionContextCondition", + "GroupChatConfig", + "GroupChatTarget", + # "GroupManagerSelectionMessageContextStr", + # "GroupManagerSelectionMessageString", + # "GroupManagerTarget", + "Handoffs", + "NestedChatTarget", + "OnCondition", + "OnContextCondition", + "ReplyResult", + "RevertToUserTarget", + "SpeakerSelectionResult", + "StayTarget", + "StringAvailableCondition", + "StringContextCondition", + 
"StringLLMCondition", + "TerminateTarget", +] diff --git a/mm_agents/coact/autogen/agentchat/group/available_condition.py b/mm_agents/coact/autogen/agentchat/group/available_condition.py new file mode 100644 index 0000000..3fbc871 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/available_condition.py @@ -0,0 +1,91 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import TYPE_CHECKING, Any + +from pydantic import BaseModel + +from .context_expression import ContextExpression + +if TYPE_CHECKING: + # Avoid circular import + from ..conversable_agent import ConversableAgent + +__all__ = ["AvailableCondition", "ExpressionAvailableCondition", "StringAvailableCondition"] + + +class AvailableCondition(BaseModel): + """Protocol for determining if a condition is available to be evaluated.""" + + def is_available(self, agent: "ConversableAgent", messages: list[dict[str, Any]]) -> bool: + """Determine if the condition should be considered for evaluation. + + Args: + agent: The agent evaluating the condition + messages: The conversation history + + Returns: + True if the condition should be evaluated, False otherwise + """ + raise NotImplementedError("Requires subclasses to implement.") + + +class StringAvailableCondition(AvailableCondition): + """String-based available condition. + + This condition checks if a named context variable exists and is truthy. + """ + + context_variable: str + + def __init__(self, context_variable: str, **data: Any) -> None: + """Initialize with a context variable name as a positional parameter. + + Args: + context_variable: The name of the context variable to check + data: Additional data for the parent class + """ + super().__init__(context_variable=context_variable, **data) + + def is_available(self, agent: "ConversableAgent", messages: list[dict[str, Any]]) -> bool: + """Check if the named context variable is truthy. + + Args: + agent: The agent with context variables + messages: The conversation history (not used) + + Returns: + True if the variable exists and is truthy, False otherwise + """ + return bool(agent.context_variables.get(self.context_variable, False)) + + +class ExpressionAvailableCondition(AvailableCondition): + """Expression-based available condition. + + This condition evaluates a ContextExpression against the context variables. + """ + + expression: ContextExpression + + def __init__(self, expression: ContextExpression, **data: Any) -> None: + """Initialize with an expression as a positional parameter. + + Args: + expression: The context expression to evaluate + data: Additional data for the parent class + """ + super().__init__(expression=expression, **data) + + def is_available(self, agent: "ConversableAgent", messages: list[dict[str, Any]]) -> bool: + """Evaluate the expression against the context variables. 
+ + Args: + agent: The agent with context variables + messages: The conversation history (not used) + + Returns: + Boolean result of the expression evaluation + """ + return self.expression.evaluate(agent.context_variables) diff --git a/mm_agents/coact/autogen/agentchat/group/context_condition.py b/mm_agents/coact/autogen/agentchat/group/context_condition.py new file mode 100644 index 0000000..9a4b495 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/context_condition.py @@ -0,0 +1,77 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + + +from typing import Any + +from pydantic import BaseModel + +from .context_expression import ContextExpression +from .context_variables import ContextVariables + +__all__ = ["ContextCondition", "ExpressionContextCondition", "StringContextCondition"] + + +class ContextCondition(BaseModel): + """Protocol for conditions evaluated directly using context variables.""" + + def evaluate(self, context_variables: ContextVariables) -> bool: + """Evaluate the condition to a boolean result. + + Args: + context_variables: The context variables to evaluate against + + Returns: + Boolean result of the condition evaluation + """ + raise NotImplementedError("Requires subclasses to implement.") + + +class StringContextCondition(ContextCondition): + """Simple string-based context condition. + + This condition checks if a named context variable exists and is truthy. + """ + + variable_name: str + + def evaluate(self, context_variables: ContextVariables) -> bool: + """Check if the named context variable is truthy. + + Args: + context_variables: The context variables to check against + + Returns: + True if the variable exists and is truthy, False otherwise + """ + return bool(context_variables.get(self.variable_name, False)) + + +class ExpressionContextCondition(ContextCondition): + """Complex expression-based context condition. + + This condition evaluates a ContextExpression against the context variables. + """ + + expression: ContextExpression + + def __init__(self, expression: ContextExpression, **data: Any) -> None: + """Initialize with an expression as a positional parameter. + + Args: + expression: The context expression to evaluate + data: Additional data for the parent class + """ + super().__init__(expression=expression, **data) + + def evaluate(self, context_variables: ContextVariables) -> bool: + """Evaluate the expression against the context variables. + + Args: + context_variables: The context variables to evaluate against + + Returns: + Boolean result of the expression evaluation + """ + return self.expression.evaluate(context_variables) diff --git a/mm_agents/coact/autogen/agentchat/group/context_expression.py b/mm_agents/coact/autogen/agentchat/group/context_expression.py new file mode 100644 index 0000000..64f2052 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/context_expression.py @@ -0,0 +1,238 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +import ast +import re +from dataclasses import dataclass + +from ...doc_utils import export_module +from .context_variables import ContextVariables + + +@dataclass +@export_module("autogen") +class ContextExpression: + """A class to evaluate logical expressions using context variables. + + Args: + expression (str): A string containing a logical expression with context variable references. 
+ - Variable references use ${var_name} syntax: ${logged_in}, ${attempts} + - String literals can use normal quotes: 'hello', "world" + - Supported operators: + - Logical: not/!, and/&, or/| + - Comparison: >, <, >=, <=, ==, != + - Supported functions: + - len(${var_name}): Gets the length of a list, string, or other collection + - Parentheses can be used for grouping + - Examples: + - "not ${logged_in} and ${is_admin} or ${guest_checkout}" + - "!${logged_in} & ${is_admin} | ${guest_checkout}" + - "len(${orders}) > 0 & ${user_active}" + - "len(${cart_items}) == 0 | ${checkout_started}" + + Raises: + SyntaxError: If the expression cannot be parsed + ValueError: If the expression contains disallowed operations + """ + + expression: str + + def __post_init__(self) -> None: + # Validate the expression immediately upon creation + try: + # Extract variable references and replace with placeholders + self._variable_names = self._extract_variable_names(self.expression) + + # Convert symbolic operators to Python keywords + python_expr = self._convert_to_python_syntax(self.expression) + + # Sanitize for AST parsing + sanitized_expr = self._prepare_for_ast(python_expr) + + # Use ast to parse and validate the expression + self._ast = ast.parse(sanitized_expr, mode="eval") + + # Verify it only contains allowed operations + self._validate_operations(self._ast.body) + + # Store the Python-syntax version for evaluation + self._python_expr = python_expr + + except SyntaxError as e: + raise SyntaxError(f"Invalid expression syntax in '{self.expression}': {str(e)}") + except Exception as e: + raise ValueError(f"Error validating expression '{self.expression}': {str(e)}") + + def _extract_variable_names(self, expr: str) -> list[str]: + """Extract all variable references ${var_name} from the expression.""" + # Find all patterns like ${var_name} + matches = re.findall(r"\${([^}]*)}", expr) + return matches + + def _convert_to_python_syntax(self, expr: str) -> str: + """Convert symbolic operators to Python keywords.""" + # We need to be careful about operators inside string literals + # First, temporarily replace string literals with placeholders + string_literals = [] + + def replace_string_literal(match: re.Match[str]) -> str: + string_literals.append(match.group(0)) + return f"__STRING_LITERAL_{len(string_literals) - 1}__" + + # Replace both single and double quoted strings + expr_without_strings = re.sub(r"'[^']*'|\"[^\"]*\"", replace_string_literal, expr) + + # Handle the NOT operator (!) - no parentheses handling needed + # Replace standalone ! 
before variables or expressions + expr_without_strings = re.sub(r"!\s*(\${|\()", "not \\1", expr_without_strings) + + # Handle AND and OR operators - simpler approach without parentheses handling + expr_without_strings = re.sub(r"\s+&\s+", " and ", expr_without_strings) + expr_without_strings = re.sub(r"\s+\|\s+", " or ", expr_without_strings) + + # Now put string literals back + for i, literal in enumerate(string_literals): + expr_without_strings = expr_without_strings.replace(f"__STRING_LITERAL_{i}__", literal) + + return expr_without_strings + + def _prepare_for_ast(self, expr: str) -> str: + """Convert the expression to valid Python for AST parsing by replacing variables with placeholders.""" + # Replace ${var_name} with var_name for AST parsing + processed_expr = expr + for var_name in self._variable_names: + processed_expr = processed_expr.replace(f"${{{var_name}}}", var_name) + + return processed_expr + + def _validate_operations(self, node: ast.AST) -> None: + """Recursively validate that only allowed operations exist in the AST.""" + allowed_node_types = ( + # Boolean operations + ast.BoolOp, + ast.UnaryOp, + ast.And, + ast.Or, + ast.Not, + # Comparison operations + ast.Compare, + ast.Eq, + ast.NotEq, + ast.Lt, + ast.LtE, + ast.Gt, + ast.GtE, + # Basic nodes + ast.Name, + ast.Load, + ast.Constant, + ast.Expression, + # Support for basic numeric operations in comparisons + ast.Num, + ast.NameConstant, + # Support for negative numbers + ast.USub, + ast.UnaryOp, + # Support for string literals + ast.Str, + ast.Constant, + # Support for function calls (specifically len()) + ast.Call, + ) + + if not isinstance(node, allowed_node_types): + raise ValueError(f"Operation type {type(node).__name__} is not allowed in logical expressions") + + # Special validation for function calls - only allow len() + if isinstance(node, ast.Call): + if not (isinstance(node.func, ast.Name) and node.func.id == "len"): + raise ValueError(f"Only the len() function is allowed, got: {getattr(node.func, 'id', 'unknown')}") + if len(node.args) != 1: + raise ValueError(f"len() function must have exactly one argument, got {len(node.args)}") + + # Special validation for Compare nodes + if isinstance(node, ast.Compare): + for op in node.ops: + if not isinstance(op, (ast.Eq, ast.NotEq, ast.Lt, ast.LtE, ast.Gt, ast.GtE)): + raise ValueError(f"Comparison operator {type(op).__name__} is not allowed") + + # Recursively check child nodes + for child in ast.iter_child_nodes(node): + self._validate_operations(child) + + def evaluate(self, context_variables: ContextVariables) -> bool: + """Evaluate the expression using the provided context variables. 
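+
+        Example (a minimal sketch using the operator and len() syntax documented on this class):
+            ```
+            expr = ContextExpression("not ${logged_in} and len(${cart_items}) > 0")
+            ctx = ContextVariables(data={"logged_in": False, "cart_items": ["apple", "pear"]})
+            expr.evaluate(ctx)  # True: the user is not logged in and the cart is non-empty
+            ```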
+ + Args: + context_variables: Dictionary of context variables to use for evaluation + + Returns: + bool: The result of evaluating the expression + + Raises: + KeyError: If a variable referenced in the expression is not found in the context + """ + # Create a modified expression that we can safely evaluate + eval_expr = self._python_expr # Use the Python-syntax version + + # First, handle len() functions with variable references inside + len_pattern = r"len\(\${([^}]*)}\)" + len_matches = list(re.finditer(len_pattern, eval_expr)) + + # Process all len() operations first + for match in len_matches: + var_name = match.group(1) + # Check if variable exists in context, raise KeyError if not + if not context_variables.contains(var_name): + raise KeyError(f"Missing context variable: '{var_name}'") + + var_value = context_variables.get(var_name) + + # Calculate the length - works for lists, strings, dictionaries, etc. + try: + length_value = len(var_value) # type: ignore[arg-type] + except TypeError: + # If the value doesn't support len(), treat as 0 + length_value = 0 + + # Replace the len() expression with the actual length + full_match = match.group(0) + eval_expr = eval_expr.replace(full_match, str(length_value)) + + # Then replace remaining variable references with their values + for var_name in self._variable_names: + # Skip variables that were already processed in len() expressions + if any(m.group(1) == var_name for m in len_matches): + continue + + # Check if variable exists in context, raise KeyError if not + if not context_variables.contains(var_name): + raise KeyError(f"Missing context variable: '{var_name}'") + + # Get the value from context + var_value = context_variables.get(var_name) + + # Format the value appropriately based on its type + if isinstance(var_value, (bool, int, float)): + formatted_value = str(var_value) + elif isinstance(var_value, str): + formatted_value = f"'{var_value}'" # Quote strings + elif isinstance(var_value, (list, dict, tuple)): + # For collections, convert to their boolean evaluation + formatted_value = str(bool(var_value)) + else: + formatted_value = str(var_value) + + # Replace the variable reference with the formatted value + eval_expr = eval_expr.replace(f"${{{var_name}}}", formatted_value) + + try: + return eval(eval_expr) # type: ignore[no-any-return] + except Exception as e: + raise ValueError( + f"Error evaluating expression '{self.expression}' (are you sure you're using ${{my_context_variable_key}}): {str(e)}" + ) + + def __str__(self) -> str: + return f"ContextExpression('{self.expression}')" diff --git a/mm_agents/coact/autogen/agentchat/group/context_str.py b/mm_agents/coact/autogen/agentchat/group/context_str.py new file mode 100644 index 0000000..2c42d83 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/context_str.py @@ -0,0 +1,41 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import Optional + +from pydantic import BaseModel + +from .context_variables import ContextVariables + +__all__ = ["ContextStr"] + + +class ContextStr(BaseModel): + """A string that requires context variable substitution. + + Use the format method to substitute context variables into the string. + """ + + """The string to be substituted with context variables. 
It is expected that the string will contain `{var}` placeholders and that string format will be able to replace all values.""" + template: str + + def format(self, context_variables: ContextVariables) -> Optional[str]: + """Substitute context variables into the string. + + Args: + context_variables (ContextVariables): The context variables to substitute into the string. + + Returns: + Optional[str]: The formatted string with context variables substituted. + """ + + context = context_variables.to_dict() + + if not context: + return self.template + + return self.template.format(**context) + + def __str__(self) -> str: + return f"ContextStr, unformatted: {self.template}" diff --git a/mm_agents/coact/autogen/agentchat/group/context_variables.py b/mm_agents/coact/autogen/agentchat/group/context_variables.py new file mode 100644 index 0000000..4ef8fef --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/context_variables.py @@ -0,0 +1,192 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import Any, Generator, Iterable, Optional + +from pydantic import BaseModel, Field + +__all__ = ["ContextVariables"] + +# Parameter name for context variables +# Use the value in functions and they will be substituted with the context variables: +# e.g. def my_function(context_variables: ContextVariables, my_other_parameters: Any) -> Any: +__CONTEXT_VARIABLES_PARAM_NAME__ = "context_variables" + + +class ContextVariables(BaseModel): + """ + Stores and manages context variables for agentic workflows. + + Utilises a dictionary-like interface for setting, getting, and removing variables. + """ + + # Internal storage for context variables + data: dict[str, Any] = Field(default_factory=dict) + + def __init__(self, data: Optional[dict[str, Any]] = None, **kwargs: Any) -> None: + """Initialize with data dictionary as an optional positional parameter. + + Args: + data: Initial dictionary of context variables (optional) + kwargs: Additional keyword arguments for the parent class + """ + init_data = data or {} + super().__init__(data=init_data, **kwargs) + + def get(self, key: str, default: Optional[Any] = None) -> Optional[Any]: + """ + Get a value from the context by key. + + Args: + key: The key to retrieve + default: The default value to return if key is not found + + Returns: + The value associated with the key or default if not found + """ + return self.data.get(key, default) + + def set(self, key: str, value: Any) -> None: + """ + Set a value in the context by key. + + Args: + key: The key to set + value: The value to store + """ + self.data[key] = value + + def remove(self, key: str) -> bool: + """ + Remove a key from the context. + + Args: + key: The key to remove + + Returns: + True if the key was removed, False if it didn't exist + """ + if key in self.data: + del self.data[key] + return True + return False + + def keys(self) -> Iterable[str]: + """ + Get all keys in the context. + + Returns: + An iterable of all keys + """ + return self.data.keys() + + def values(self) -> Iterable[Any]: + """ + Get all values in the context. + + Returns: + An iterable of all values + """ + return self.data.values() + + def items(self) -> Iterable[tuple[str, Any]]: + """ + Get all key-value pairs in the context. 
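+
+        Example (illustrative):
+            ```
+            ctx = ContextVariables(data={"user": "ada", "attempts": 3})
+            for key, value in ctx.items():
+                print(key, value)  # -> "user ada", then "attempts 3"
+            ```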
+ + Returns: + An iterable of all key-value pairs + """ + return self.data.items() + + def clear(self) -> None: + """Clear all keys and values from the context.""" + self.data.clear() + + def contains(self, key: str) -> bool: + """ + Check if a key exists in the context. + + Args: + key: The key to check + + Returns: + True if the key exists, False otherwise + """ + return key in self.data + + def update(self, other: dict[str, Any]) -> None: + """ + Update context with key-value pairs from another dictionary. + + Args: + other: Dictionary containing key-value pairs to add + """ + self.data.update(other) + + def to_dict(self) -> dict[str, Any]: + """ + Convert context variables to a dictionary. + + Returns: + Dictionary representation of all context variables + """ + return self.data.copy() + + # Dictionary-compatible interface + def __getitem__(self, key: str) -> Any: + """Get a value using dictionary syntax: context[key]""" + try: + return self.data[key] + except KeyError: + raise KeyError(f"Context variable '{key}' not found") + + def __setitem__(self, key: str, value: Any) -> None: + """Set a value using dictionary syntax: context[key] = value""" + self.data[key] = value + + def __delitem__(self, key: str) -> None: + """Delete a key using dictionary syntax: del context[key]""" + try: + del self.data[key] + except KeyError: + raise KeyError(f"Cannot delete non-existent context variable '{key}'") + + def __contains__(self, key: str) -> bool: + """Check if key exists using 'in' operator: key in context""" + return key in self.data + + def __len__(self) -> int: + """Get the number of items: len(context)""" + return len(self.data) + + def __iter__(self) -> Generator[tuple[str, Any], None, None]: + """Iterate over keys: for key in context""" + for key in self.data: + yield (key, self.data[key]) + + def __str__(self) -> str: + """String representation of context variables.""" + return f"ContextVariables({self.data})" + + def __repr__(self) -> str: + """Detailed representation of context variables.""" + return f"ContextVariables(data={self.data!r})" + + # Utility methods + @classmethod + def from_dict(cls, data: dict[str, Any]) -> "ContextVariables": + """ + Create a new ContextVariables instance from a dictionary. 
+ + E.g.: + my_context = {"user_id": "12345", "settings": {"theme": "dark"}} + context = ContextVariables.from_dict(my_context) + + Args: + data: Dictionary of key-value pairs + + Returns: + New ContextVariables instance + """ + return cls(data=data) diff --git a/mm_agents/coact/autogen/agentchat/group/group_tool_executor.py b/mm_agents/coact/autogen/agentchat/group/group_tool_executor.py new file mode 100644 index 0000000..1f50e09 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/group_tool_executor.py @@ -0,0 +1,202 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +import inspect +from copy import deepcopy +from typing import Annotated, Any, Callable, Optional + +from ...oai import OpenAIWrapper +from ...tools import Depends, Tool +from ...tools.dependency_injection import inject_params, on +from ..agent import Agent +from ..conversable_agent import ConversableAgent +from .context_variables import __CONTEXT_VARIABLES_PARAM_NAME__, ContextVariables +from .reply_result import ReplyResult +from .targets.transition_target import TransitionTarget + +__TOOL_EXECUTOR_NAME__ = "_Group_Tool_Executor" + + +class GroupToolExecutor(ConversableAgent): + """Tool executor for the group chat initiated with initiate_group_chat""" + + def __init__(self) -> None: + super().__init__( + name=__TOOL_EXECUTOR_NAME__, + system_message="Tool Execution, do not use this agent directly.", + human_input_mode="NEVER", + code_execution_config=False, + ) + + # Store the next target from a tool call + self._group_next_target: Optional[TransitionTarget] = None + + # Primary tool reply function for handling the tool reply and the ReplyResult and TransitionTarget returns + self.register_reply([Agent, None], self._generate_group_tool_reply, remove_other_reply_funcs=True) + + def set_next_target(self, next_target: TransitionTarget) -> None: + """Sets the next target to transition to, used in the determine_next_agent function.""" + self._group_next_target = next_target + + def get_next_target(self) -> TransitionTarget: + """Gets the next target to transition to.""" + """Returns the next target to transition to, if it exists.""" + if self._group_next_target is None: + raise ValueError( + "No next target set. Please set a next target before calling this method. Use has_next_target() to check if a next target exists." + ) + return self._group_next_target + + def has_next_target(self) -> bool: + """Checks if there is a next target to transition to.""" + return self._group_next_target is not None + + def clear_next_target(self) -> None: + """Clears the next target to transition to.""" + self._group_next_target = None + + def _modify_context_variables_param( + self, f: Callable[..., Any], context_variables: ContextVariables + ) -> Callable[..., Any]: + """Modifies the context_variables parameter to use dependency injection and link it to the group context variables. 
+ + This essentially changes: + def some_function(some_variable: int, context_variables: ContextVariables) -> str: + + to: + + def some_function(some_variable: int, context_variables: Annotated[ContextVariables, Depends(on(self.context_variables))]) -> str: + """ + sig = inspect.signature(f) + + # Check if context_variables parameter exists and update it if so + if __CONTEXT_VARIABLES_PARAM_NAME__ in sig.parameters: + new_params = [] + for name, param in sig.parameters.items(): + if name == __CONTEXT_VARIABLES_PARAM_NAME__: + # Replace with new annotation using Depends + new_param = param.replace(annotation=Annotated[ContextVariables, Depends(on(context_variables))]) + new_params.append(new_param) + else: + new_params.append(param) + + # Update signature + new_sig = sig.replace(parameters=new_params) + f.__signature__ = new_sig # type: ignore[attr-defined] + + return f + + def _change_tool_context_variables_to_depends( + self, agent: ConversableAgent, current_tool: Tool, context_variables: ContextVariables + ) -> None: + """Checks for the context_variables parameter in the tool and updates it to use dependency injection.""" + + # If the tool has a context_variables parameter, remove the tool and reregister it without the parameter + if __CONTEXT_VARIABLES_PARAM_NAME__ in current_tool.tool_schema["function"]["parameters"]["properties"]: + # We'll replace the tool, so start with getting the underlying function + tool_func = current_tool._func + + # Remove the Tool from the agent + name = current_tool._name + description = current_tool._description + agent.remove_tool_for_llm(current_tool) + + # Recreate the tool without the context_variables parameter + tool_func = self._modify_context_variables_param(current_tool._func, context_variables) + tool_func = inject_params(tool_func) + new_tool = ConversableAgent._create_tool_if_needed( + func_or_tool=tool_func, name=name, description=description + ) + + # Re-register with the agent + agent.register_for_llm()(new_tool) + + def register_agents_functions(self, agents: list[ConversableAgent], context_variables: ContextVariables) -> None: + """Adds the functions of the agents to the group tool executor.""" + for agent in agents: + # As we're moving towards tools and away from function maps, this may not be used + self._function_map.update(agent._function_map) + + # Update any agent tools that have context_variables parameters to use Dependency Injection + for tool in agent.tools: + self._change_tool_context_variables_to_depends(agent, tool, context_variables) + + # Add all tools to the Tool Executor agent + for tool in agent.tools: + self.register_for_execution(serialize=False, silent_override=True)(tool) + + def _generate_group_tool_reply( + self, + agent: ConversableAgent, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[OpenAIWrapper] = None, + ) -> tuple[bool, Optional[dict[str, Any]]]: + """Pre-processes and generates tool call replies. + + This function: + 1. Adds context_variables back to the tool call for the function, if necessary. + 2. Generates the tool calls reply. + 3. 
Updates context_variables and next_agent based on the tool call response.""" + + if config is None: + config = agent # type: ignore[assignment] + if messages is None: + messages = agent._oai_messages[sender] + + message = messages[-1] + if "tool_calls" in message: + tool_call_count = len(message["tool_calls"]) + + # Loop through tool calls individually (so context can be updated after each function call) + next_target: Optional[TransitionTarget] = None + tool_responses_inner = [] + contents = [] + for index in range(tool_call_count): + message_copy = deepcopy(message) + + # 1. add context_variables to the tool call arguments + tool_call = message_copy["tool_calls"][index] + + # Ensure we are only executing the one tool at a time + message_copy["tool_calls"] = [tool_call] + + # 2. generate tool calls reply + _, tool_message = agent.generate_tool_calls_reply([message_copy]) + + if tool_message is None: + raise ValueError("Tool call did not return a message") + + # 3. update context_variables and next_agent, convert content to string + for tool_response in tool_message["tool_responses"]: + content = tool_response.get("content") + + # Tool Call returns that are a target are either a ReplyResult or a TransitionTarget are the next agent + if isinstance(content, ReplyResult): + if content.context_variables and content.context_variables.to_dict() != {}: + agent.context_variables.update(content.context_variables.to_dict()) + if content.target is not None: + next_target = content.target + elif isinstance(content, TransitionTarget): + next_target = content + + # Serialize the content to a string + if content is not None: + tool_response["content"] = str(content) + + tool_responses_inner.append(tool_response) + contents.append(str(tool_response["content"])) + + self._group_next_target = next_target # type: ignore[attr-defined] + + # Put the tool responses and content strings back into the response message + # Caters for multiple tool calls + if tool_message is None: + raise ValueError("Tool call did not return a message") + + tool_message["tool_responses"] = tool_responses_inner + tool_message["content"] = "\n".join(contents) + + return True, tool_message + return False, None diff --git a/mm_agents/coact/autogen/agentchat/group/group_utils.py b/mm_agents/coact/autogen/agentchat/group/group_utils.py new file mode 100644 index 0000000..beef771 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/group_utils.py @@ -0,0 +1,636 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +import copy +from functools import partial +from types import MethodType +from typing import TYPE_CHECKING, Any, Callable, Optional, Union + +from ..agent import Agent +from ..groupchat import GroupChat, GroupChatManager +from .context_variables import ContextVariables +from .group_tool_executor import GroupToolExecutor +from .targets.group_manager_target import GroupManagerTarget +from .targets.transition_target import ( + AgentNameTarget, + AgentTarget, + TransitionTarget, +) + +if TYPE_CHECKING: + from ..conversable_agent import ConversableAgent + +# Utility functions for group chat preparation and management +# These are extracted from multi_agent_chat.py to avoid circular imports + + +def update_conditional_functions(agent: "ConversableAgent", messages: list[dict[str, Any]]) -> None: + """Updates the agent's functions based on the OnCondition's available condition. 
+ + All functions are removed and then added back if they are available + """ + for on_condition in agent.handoffs.llm_conditions: + is_available = on_condition.available.is_available(agent, messages) if on_condition.available else True + + # Remove it from their tools + for tool in agent.tools: + if tool.name == on_condition.llm_function_name: + agent.remove_tool_for_llm(tool) + break + + # then add the function if it is available, so that the function signature is updated + if is_available: + agent._add_single_function( + _create_on_condition_handoff_function(on_condition.target), + on_condition.llm_function_name, + on_condition.condition.get_prompt(agent, messages), + ) + + +def establish_group_agent(agent: "ConversableAgent") -> None: + """Establish the group agent with the group-related attributes and hooks. Not for the tool executor. + + Args: + agent ("ConversableAgent"): The agent to establish as a group agent. + """ + + def _group_agent_str(self: "ConversableAgent") -> str: + """Customise the __str__ method to show the agent name for transition messages.""" + return f"Group agent --> {self.name}" + + # Register the hook to update agent state (except tool executor) + agent.register_hook("update_agent_state", update_conditional_functions) + + # Register a reply function to run Python function-based OnContextConditions before any other reply function + agent.register_reply(trigger=([Agent, None]), reply_func=_run_oncontextconditions, position=0) + + agent._get_display_name = MethodType(_group_agent_str, agent) # type: ignore[method-assign] + + # Mark this agent as established as a group agent + agent._group_is_established = True # type: ignore[attr-defined] + + +def link_agents_to_group_manager(agents: list[Agent], group_chat_manager: Agent) -> None: + """Link all agents to the GroupChatManager so they can access the underlying GroupChat and other agents. + + This is primarily used so that agents can get to the tool executor to help set the next agent. + + Does not link the Tool Executor agent. + """ + for agent in agents: + agent._group_manager = group_chat_manager # type: ignore[attr-defined] + + +def _evaluate_after_works_conditions( + agent: "ConversableAgent", + groupchat: GroupChat, + user_agent: Optional["ConversableAgent"], +) -> Optional[Union[Agent, str]]: + """Evaluate after_works context conditions for an agent. 
+ + Args: + agent: The agent to evaluate after_works conditions for + groupchat: The current group chat + user_agent: Optional user proxy agent + + Returns: + The resolved speaker selection result if a condition matches, None otherwise + """ + if not hasattr(agent, "handoffs") or not agent.handoffs.after_works: # type: ignore[attr-defined] + return None + + for after_work_condition in agent.handoffs.after_works: # type: ignore[attr-defined] + # Check if condition is available + is_available = ( + after_work_condition.available.is_available(agent, groupchat.messages) + if after_work_condition.available + else True + ) + + # Evaluate the condition (None condition means always true) + if is_available and ( + after_work_condition.condition is None or after_work_condition.condition.evaluate(agent.context_variables) + ): + # Condition matched, resolve and return + return after_work_condition.target.resolve( + groupchat, + agent, + user_agent, + ).get_speaker_selection_result(groupchat) + + return None + + +def _run_oncontextconditions( + agent: "ConversableAgent", + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[Any] = None, +) -> tuple[bool, Optional[Union[str, dict[str, Any]]]]: + """Run OnContextConditions for an agent before any other reply function.""" + for on_condition in agent.handoffs.context_conditions: # type: ignore[attr-defined] + is_available = ( + on_condition.available.is_available(agent, messages if messages else []) if on_condition.available else True + ) + + if is_available and ( + on_condition.condition is None or on_condition.condition.evaluate(agent.context_variables) + ): + # Condition has been met, we'll set the Tool Executor's next target + # attribute and that will be picked up on the next iteration when + # _determine_next_agent is called + for agent in agent._group_manager.groupchat.agents: # type: ignore[attr-defined] + if isinstance(agent, GroupToolExecutor): + agent.set_next_target(on_condition.target) + break + + transfer_name = on_condition.target.display_name() + + return True, "[Handing off to " + transfer_name + "]" + + return False, None + + +def _create_on_condition_handoff_function(target: TransitionTarget) -> Callable[[], TransitionTarget]: + """Creates a function that will be used by the tool call reply function when the condition is met. + + Args: + target (TransitionTarget): The target to transfer to. + + Returns: + Callable: The transfer function. + """ + + def transfer_to_target() -> TransitionTarget: + return target + + return transfer_to_target + + +def create_on_condition_handoff_functions(agent: "ConversableAgent") -> None: + """Creates the functions for the OnConditions so that the current tool handling works. + + Args: + agent ("ConversableAgent"): The agent to create the functions for. 
+ """ + # Populate the function names for the handoffs + agent.handoffs.set_llm_function_names() + + # Create a function for each OnCondition + for on_condition in agent.handoffs.llm_conditions: + # Create a function that will be called when the condition is met + agent._add_single_function( + _create_on_condition_handoff_function(on_condition.target), + on_condition.llm_function_name, + on_condition.condition.get_prompt(agent, []), + ) + + +def ensure_handoff_agents_in_group(agents: list["ConversableAgent"]) -> None: + """Ensure the agents in handoffs are in the group chat.""" + agent_names = [agent.name for agent in agents] + for agent in agents: + for llm_conditions in agent.handoffs.llm_conditions: + if ( + isinstance(llm_conditions.target, (AgentTarget, AgentNameTarget)) + and llm_conditions.target.agent_name not in agent_names + ): + raise ValueError("Agent in OnCondition Hand-offs must be in the agents list") + for context_conditions in agent.handoffs.context_conditions: + if ( + isinstance(context_conditions.target, (AgentTarget, AgentNameTarget)) + and context_conditions.target.agent_name not in agent_names + ): + raise ValueError("Agent in OnContextCondition Hand-offs must be in the agents list") + # Check after_works targets + for after_work_condition in agent.handoffs.after_works: + if ( + isinstance(after_work_condition.target, (AgentTarget, AgentNameTarget)) + and after_work_condition.target.agent_name not in agent_names + ): + raise ValueError("Agent in after work target Hand-offs must be in the agents list") + + +def prepare_exclude_transit_messages(agents: list["ConversableAgent"]) -> None: + """Preparation for excluding transit messages by getting all tool names and registering a hook on agents to remove those messages.""" + # get all transit functions names + to_be_removed: list[str] = [] + for agent in agents: + for on_condition in agent.handoffs.llm_conditions: + if on_condition.llm_function_name: + to_be_removed.append(on_condition.llm_function_name) + else: + raise ValueError("OnCondition must have a function name") + + remove_function = make_remove_function(to_be_removed) + + # register hook to remove transit messages for group agents + for agent in agents: + agent.register_hook("process_all_messages_before_reply", remove_function) + + +def prepare_group_agents( + agents: list["ConversableAgent"], + context_variables: ContextVariables, + exclude_transit_message: bool = True, +) -> tuple[GroupToolExecutor, list["ConversableAgent"]]: + """Validates agents, create the tool executor, wrap necessary targets in agents. + + Args: + agents (list["ConversableAgent"]): List of all agents in the conversation. + context_variables (ContextVariables): Context variables to assign to all agents. + exclude_transit_message (bool): Whether to exclude transit messages from the agents. + + Returns: + "ConversableAgent": The tool executor agent. + list["ConversableAgent"]: List of wrapped agents. 
+ """ + # Initialise all agents as group agents + for agent in agents: + if not hasattr(agent, "_group_is_established"): + establish_group_agent(agent) + + # Ensure all agents in hand-off after-works are in the passed in agents list + ensure_handoff_agents_in_group(agents) + + # Create Tool Executor for the group + tool_execution = GroupToolExecutor() + + # Wrap handoff targets in agents that need to be wrapped + wrapped_chat_agents: list["ConversableAgent"] = [] + for agent in agents: + wrap_agent_handoff_targets(agent, wrapped_chat_agents) + + # Create the functions for the OnConditions so that the current tool handling works + for agent in agents: + create_on_condition_handoff_functions(agent) + + # Register all the agents' functions with the tool executor and + # use dependency injection for the context variables parameter + # Update tool execution agent with all the functions from all the agents + tool_execution.register_agents_functions(agents + wrapped_chat_agents, context_variables) + + if exclude_transit_message: + prepare_exclude_transit_messages(agents) + + return tool_execution, wrapped_chat_agents + + +def wrap_agent_handoff_targets(agent: "ConversableAgent", wrapped_agent_list: list["ConversableAgent"]) -> None: + """Wrap handoff targets in agents that need to be wrapped to be part of the group chat. + + Example is NestedChatTarget. + + Args: + agent ("ConversableAgent"): The agent to wrap the handoff targets for. + wrapped_agent_list (list["ConversableAgent"]): List of wrapped chat agents that will be appended to. + """ + # Wrap OnCondition targets + for i, handoff_oncondition_requiring_wrapping in enumerate(agent.handoffs.get_llm_conditions_requiring_wrapping()): + # Create wrapper agent + wrapper_agent = handoff_oncondition_requiring_wrapping.target.create_wrapper_agent(parent_agent=agent, index=i) + wrapped_agent_list.append(wrapper_agent) + + # Change this handoff target to point to the newly created agent + handoff_oncondition_requiring_wrapping.target = AgentTarget(wrapper_agent) + + for i, handoff_oncontextcondition_requiring_wrapping in enumerate( + agent.handoffs.get_context_conditions_requiring_wrapping() + ): + # Create wrapper agent + wrapper_agent = handoff_oncontextcondition_requiring_wrapping.target.create_wrapper_agent( + parent_agent=agent, index=i + ) + wrapped_agent_list.append(wrapper_agent) + + # Change this handoff target to point to the newly created agent + handoff_oncontextcondition_requiring_wrapping.target = AgentTarget(wrapper_agent) + + +def process_initial_messages( + messages: Union[list[dict[str, Any]], str], + user_agent: Optional["ConversableAgent"], + agents: list["ConversableAgent"], + wrapped_agents: list["ConversableAgent"], +) -> tuple[list[dict[str, Any]], Optional["ConversableAgent"], list[str], list[Agent]]: + """Process initial messages, validating agent names against messages, and determining the last agent to speak. + + Args: + messages: Initial messages to process. + user_agent: Optional user proxy agent passed in to a_/initiate_group_chat. + agents: Agents in the group. + wrapped_agents: List of wrapped agents. + + Returns: + list[dict[str, Any]]: Processed message(s). + Agent: Last agent to speak. + list[str]: List of agent names. + list[Agent]: List of temporary user proxy agents to add to GroupChat. 
+ """ + from ..conversable_agent import ConversableAgent # NEED SOLUTION + + if isinstance(messages, str): + messages = [{"role": "user", "content": messages}] + + group_agent_names = [agent.name for agent in agents + wrapped_agents] + + # If there's only one message and there's no identified group agent + # Start with a user proxy agent, creating one if they haven't passed one in + last_agent: Optional[ConversableAgent] + temp_user_proxy: Optional[ConversableAgent] = None + temp_user_list: list[Agent] = [] + if len(messages) == 1 and "name" not in messages[0] and not user_agent: + temp_user_proxy = ConversableAgent(name="_User", code_execution_config=False, human_input_mode="ALWAYS") + last_agent = temp_user_proxy + temp_user_list.append(temp_user_proxy) + else: + last_message = messages[0] + if "name" in last_message: + if last_message["name"] in group_agent_names: + last_agent = next(agent for agent in agents + wrapped_agents if agent.name == last_message["name"]) # type: ignore[assignment] + elif user_agent and last_message["name"] == user_agent.name: + last_agent = user_agent + else: + raise ValueError(f"Invalid group agent name in last message: {last_message['name']}") + else: + last_agent = user_agent if user_agent else temp_user_proxy + + return messages, last_agent, group_agent_names, temp_user_list + + +def setup_context_variables( + tool_execution: "ConversableAgent", + agents: list["ConversableAgent"], + manager: GroupChatManager, + user_agent: Optional["ConversableAgent"], + context_variables: ContextVariables, +) -> None: + """Assign a common context_variables reference to all agents in the group, including the tool executor, group chat manager, and user proxy agent. + + Args: + tool_execution: The tool execution agent. + agents: List of all agents in the conversation. + manager: GroupChatManager instance. + user_agent: Optional user proxy agent. + context_variables: Context variables to assign to all agents. + """ + for agent in agents + [tool_execution] + [manager] + ([user_agent] if user_agent else []): + agent.context_variables = context_variables + + +def cleanup_temp_user_messages(chat_result: Any) -> None: + """Remove temporary user proxy agent name from messages before returning. + + Args: + chat_result: ChatResult instance. + """ + for message in chat_result.chat_history: + if "name" in message and message["name"] == "_User": + del message["name"] + + +def get_last_agent_speaker( + groupchat: GroupChat, group_agent_names: list[str], tool_executor: GroupToolExecutor +) -> Agent: + """Get the last group agent from the group chat messages. Not including the tool executor.""" + last_group_speaker = None + for message in reversed(groupchat.messages): + if "name" in message and message["name"] in group_agent_names and message["name"] != tool_executor.name: + agent = groupchat.agent_by_name(name=message["name"]) + if agent: + last_group_speaker = agent + break + if last_group_speaker is None: + raise ValueError("No group agent found in the message history") + + return last_group_speaker + + +def determine_next_agent( + last_speaker: "ConversableAgent", + groupchat: GroupChat, + initial_agent: "ConversableAgent", + use_initial_agent: bool, + tool_executor: GroupToolExecutor, + group_agent_names: list[str], + user_agent: Optional["ConversableAgent"], + group_after_work: TransitionTarget, +) -> Optional[Union[Agent, str]]: + """Determine the next agent in the conversation. + + Args: + last_speaker ("ConversableAgent"): The last agent to speak. 
+ groupchat (GroupChat): GroupChat instance. + initial_agent ("ConversableAgent"): The initial agent in the conversation. + use_initial_agent (bool): Whether to use the initial agent straight away. + tool_executor ("ConversableAgent"): The tool execution agent. + group_agent_names (list[str]): List of agent names. + user_agent (UserProxyAgent): Optional user proxy agent. + group_after_work (TransitionTarget): Group-level Transition option when an agent doesn't select the next agent. + + Returns: + Optional[Union[Agent, str]]: The next agent or speaker selection method. + """ + + # Logic for determining the next target (anything based on Transition Target: an agent, wrapped agent, TerminateTarget, StayTarget, RevertToUserTarget, GroupManagerTarget, etc. + # 1. If it's the first response -> initial agent + # 2. If the last message is a tool call -> tool execution agent + # 3. If the Tool Executor has determined a next target (e.g. ReplyResult specified target) -> transition to tool reply target + # 4. If the user last spoke -> return to the previous agent + # NOW "AFTER WORK": + # 5. Get the After Work condition (if the agent doesn't have one, get the group-level one) + # 6. Resolve and return the After Work condition -> agent / wrapped agent / TerminateTarget / StayTarget / RevertToUserTarget / GroupManagerTarget / etc. + + # 1. If it's the first response, return the initial agent + if use_initial_agent: + return initial_agent + + # 2. If the last message is a tool call, return the tool execution agent + if "tool_calls" in groupchat.messages[-1]: + return tool_executor + + # 3. If the Tool Executor has determined a next target, return that + if tool_executor.has_next_target(): + next_agent = tool_executor.get_next_target() + tool_executor.clear_next_target() + + if next_agent.can_resolve_for_speaker_selection(): + return next_agent.resolve(groupchat, last_speaker, user_agent).get_speaker_selection_result(groupchat) + else: + raise ValueError( + "Tool Executor next target must be a valid TransitionTarget that can resolve for speaker selection." 
+ ) + + # get the last group agent + last_agent_speaker = get_last_agent_speaker(groupchat, group_agent_names, tool_executor) + + # If we are returning from a tool execution, return to the last agent that spoke + if groupchat.messages[-1]["role"] == "tool": + return last_agent_speaker + + # If the user last spoke, return to the agent prior to them (if they don't have an after work, otherwise it's treated like any other agent) + if user_agent and last_speaker == user_agent: + if not user_agent.handoffs.after_works: + return last_agent_speaker + else: + last_agent_speaker = user_agent + + # AFTER WORK: + + # First, try to evaluate after_works context conditions + after_works_result = _evaluate_after_works_conditions( + last_agent_speaker, # type: ignore[arg-type] + groupchat, + user_agent, + ) + if after_works_result is not None: + return after_works_result + + # If no after_works conditions matched, use the group-level after_work + # Resolve the next agent, termination, or speaker selection method + resolved_speaker_selection_result = group_after_work.resolve( + groupchat, + last_agent_speaker, # type: ignore[arg-type] + user_agent, + ).get_speaker_selection_result(groupchat) + + return resolved_speaker_selection_result + + +def create_group_transition( + initial_agent: "ConversableAgent", + tool_execution: GroupToolExecutor, + group_agent_names: list[str], + user_agent: Optional["ConversableAgent"], + group_after_work: TransitionTarget, +) -> Callable[["ConversableAgent", GroupChat], Optional[Union[Agent, str]]]: + """Creates a transition function for group chat with enclosed state for the use_initial_agent. + + Args: + initial_agent ("ConversableAgent"): The first agent to speak + tool_execution (GroupToolExecutor): The tool execution agent + group_agent_names (list[str]): List of all agent names + user_agent (UserProxyAgent): Optional user proxy agent + group_after_work (TransitionTarget): Group-level after work + + Returns: + Callable[["ConversableAgent", GroupChat], Optional[Union[Agent, str]]]: The transition function + """ + # Create enclosed state, this will be set once per creation so will only be True on the first execution + # of group_transition + state = {"use_initial_agent": True} + + def group_transition(last_speaker: "ConversableAgent", groupchat: GroupChat) -> Optional[Union[Agent, str]]: + result = determine_next_agent( + last_speaker=last_speaker, + groupchat=groupchat, + initial_agent=initial_agent, + use_initial_agent=state["use_initial_agent"], + tool_executor=tool_execution, + group_agent_names=group_agent_names, + user_agent=user_agent, + group_after_work=group_after_work, + ) + state["use_initial_agent"] = False + return result + + return group_transition + + +def create_group_manager( + groupchat: GroupChat, + group_manager_args: Optional[dict[str, Any]], + agents: list["ConversableAgent"], + group_after_work: TransitionTarget, +) -> GroupChatManager: + """Create a GroupChatManager for the group chat utilising any arguments passed in and ensure an LLM Config exists if needed + + Args: + groupchat (GroupChat): The groupchat. + group_manager_args (dict[str, Any]): Group manager arguments to create the GroupChatManager. + agents (list["ConversableAgent"]): List of agents in the group to check handoffs and after work. + group_after_work (TransitionTarget): Group-level after work to check. + + Returns: + GroupChatManager: GroupChatManager instance. 
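+
+ Example (illustrative sketch; llm_config is a placeholder and group_after_work
+ may be any TransitionTarget, e.g. TerminateTarget()):
+
+ manager = create_group_manager(
+ groupchat=groupchat,
+ group_manager_args={"llm_config": llm_config},
+ agents=agents,
+ group_after_work=TerminateTarget(),
+ )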
+ """ + manager_args = (group_manager_args or {}).copy() + if "groupchat" in manager_args: + raise ValueError("'groupchat' cannot be specified in group_manager_args as it is set by initiate_group_chat") + manager = GroupChatManager(groupchat, **manager_args) + + # Ensure that our manager has an LLM Config if we have any GroupManagerTarget targets used + if manager.llm_config is False: + has_group_manager_target = False + + if isinstance(group_after_work, GroupManagerTarget): + # Check group after work + has_group_manager_target = True + else: + # Check agent hand-offs and after work + for agent in agents: + if ( + len(agent.handoffs.get_context_conditions_by_target_type(GroupManagerTarget)) > 0 + or len(agent.handoffs.get_llm_conditions_by_target_type(GroupManagerTarget)) > 0 + or any(isinstance(aw.target, GroupManagerTarget) for aw in agent.handoffs.after_works) + ): + has_group_manager_target = True + break + + if has_group_manager_target: + raise ValueError( + "The group manager doesn't have an LLM Config and it is required for any targets or after works using a GroupManagerTarget. Use the 'llm_config' in the group_manager_args parameter to specify the LLM Config for the group manager." + ) + + return manager + + +def make_remove_function(tool_msgs_to_remove: list[str]) -> Callable[[list[dict[str, Any]]], list[dict[str, Any]]]: + """Create a function to remove messages with tool calls from the messages list. + + The returned function can be registered as a hook to "process_all_messages_before_reply"" to remove messages with tool calls. + """ + + def remove_messages(messages: list[dict[str, Any]], tool_msgs_to_remove: list[str]) -> list[dict[str, Any]]: + copied = copy.deepcopy(messages) + new_messages = [] + removed_tool_ids = [] + for message in copied: + # remove tool calls + if message.get("tool_calls") is not None: + filtered_tool_calls = [] + for tool_call in message["tool_calls"]: + if tool_call.get("function") is not None and tool_call["function"]["name"] in tool_msgs_to_remove: + # remove + removed_tool_ids.append(tool_call["id"]) + else: + filtered_tool_calls.append(tool_call) + if len(filtered_tool_calls) > 0: + message["tool_calls"] = filtered_tool_calls + else: + del message["tool_calls"] + if ( + message.get("content") is None + or message.get("content") == "" + or message.get("content") == "None" + ): + continue # if no tool call and no content, skip this message + # else: keep the message with tool_calls removed + # remove corresponding tool responses + elif message.get("tool_responses") is not None: + filtered_tool_responses = [] + for tool_response in message["tool_responses"]: + if tool_response["tool_call_id"] not in removed_tool_ids: + filtered_tool_responses.append(tool_response) + + if len(filtered_tool_responses) > 0: + message["tool_responses"] = filtered_tool_responses + else: + continue + + new_messages.append(message) + + return new_messages + + return partial(remove_messages, tool_msgs_to_remove=tool_msgs_to_remove) diff --git a/mm_agents/coact/autogen/agentchat/group/handoffs.py b/mm_agents/coact/autogen/agentchat/group/handoffs.py new file mode 100644 index 0000000..4d62f2e --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/handoffs.py @@ -0,0 +1,320 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import Union, overload + +from pydantic import BaseModel, Field + +from .on_condition import OnCondition +from .on_context_condition import 
OnContextCondition +from .targets.transition_target import TransitionTarget + +__all__ = ["Handoffs"] + + +class Handoffs(BaseModel): + """ + Container for all handoff transition conditions of a ConversableAgent. + + Three types of conditions can be added, each with a different order and time of use: + 1. OnContextConditions (evaluated without an LLM) + 2. OnConditions (evaluated with an LLM) + 3. After work TransitionTarget (if no other transition is triggered) + + Supports method chaining: + agent.handoffs.add_context_conditions([condition1]) \ + .add_llm_condition(condition2) \ + .set_after_work(after_work) + """ + + context_conditions: list[OnContextCondition] = Field(default_factory=list) + llm_conditions: list[OnCondition] = Field(default_factory=list) + after_works: list[OnContextCondition] = Field(default_factory=list) + + def add_context_condition(self, condition: OnContextCondition) -> "Handoffs": + """ + Add a single context condition. + + Args: + condition: The OnContextCondition to add + + Returns: + Self for method chaining + """ + # Validate that it is an OnContextCondition + if not isinstance(condition, OnContextCondition): + raise TypeError(f"Expected an OnContextCondition instance, got {type(condition).__name__}") + + self.context_conditions.append(condition) + return self + + def add_context_conditions(self, conditions: list[OnContextCondition]) -> "Handoffs": + """ + Add multiple context conditions. + + Args: + conditions: List of OnContextConditions to add + + Returns: + Self for method chaining + """ + # Validate that it is a list of OnContextConditions + if not all(isinstance(condition, OnContextCondition) for condition in conditions): + raise TypeError("All conditions must be of type OnContextCondition") + + self.context_conditions.extend(conditions) + return self + + def add_llm_condition(self, condition: OnCondition) -> "Handoffs": + """ + Add a single LLM condition. + + Args: + condition: The OnCondition to add + + Returns: + Self for method chaining + """ + # Validate that it is an OnCondition + if not isinstance(condition, OnCondition): + raise TypeError(f"Expected an OnCondition instance, got {type(condition).__name__}") + + self.llm_conditions.append(condition) + return self + + def add_llm_conditions(self, conditions: list[OnCondition]) -> "Handoffs": + """ + Add multiple LLM conditions. + + Args: + conditions: List of OnConditions to add + + Returns: + Self for method chaining + """ + # Validate that it is a list of OnConditions + if not all(isinstance(condition, OnCondition) for condition in conditions): + raise TypeError("All conditions must be of type OnCondition") + + self.llm_conditions.extend(conditions) + return self + + def set_after_work(self, target: TransitionTarget) -> "Handoffs": + """ + Set the after work target (replaces all after_works with single entry). + + For backward compatibility, this creates an OnContextCondition with no condition (always true). + + Args: + target: The after work TransitionTarget to set + + Returns: + Self for method chaining + """ + if not isinstance(target, TransitionTarget): + raise TypeError(f"Expected a TransitionTarget instance, got {type(target).__name__}") + + # Create OnContextCondition with no condition (always true) + after_work_condition = OnContextCondition(target=target, condition=None) + self.after_works = [after_work_condition] + return self + + def add_after_work(self, condition: OnContextCondition) -> "Handoffs": + """ + Add a single after-work condition. 
+ + If the condition has condition=None, it will replace any existing + condition=None entry and be placed at the end. + + Args: + condition: The OnContextCondition to add + + Returns: + Self for method chaining + """ + if not isinstance(condition, OnContextCondition): + raise TypeError(f"Expected an OnContextCondition instance, got {type(condition).__name__}") + + if condition.condition is None: + # Remove any existing condition=None entries + self.after_works = [c for c in self.after_works if c.condition is not None] + # Add the new one at the end + self.after_works.append(condition) + else: + # For regular conditions, check if we need to move condition=None to the end + none_conditions = [c for c in self.after_works if c.condition is None] + if none_conditions: + # Remove the None condition temporarily + self.after_works = [c for c in self.after_works if c.condition is not None] + # Add the new regular condition + self.after_works.append(condition) + # Re-add the None condition at the end + self.after_works.append(none_conditions[0]) + else: + # No None condition exists, just append + self.after_works.append(condition) + + return self + + def add_after_works(self, conditions: list[OnContextCondition]) -> "Handoffs": + """ + Add multiple after-work conditions. + + Special handling for condition=None entries: + - Only one condition=None entry is allowed (the fallback) + - It will always be placed at the end of the list + - If multiple condition=None entries are provided, only the last one is kept + + Args: + conditions: List of OnContextConditions to add + + Returns: + Self for method chaining + """ + # Validate that it is a list of OnContextConditions + if not all(isinstance(condition, OnContextCondition) for condition in conditions): + raise TypeError("All conditions must be of type OnContextCondition") + + # Separate conditions with None and without None + none_conditions = [c for c in conditions if c.condition is None] + regular_conditions = [c for c in conditions if c.condition is not None] + + # Remove any existing condition=None entries + self.after_works = [c for c in self.after_works if c.condition is not None] + + # Add regular conditions + self.after_works.extend(regular_conditions) + + # Add at most one None condition at the end + if none_conditions: + self.after_works.append(none_conditions[-1]) # Use the last one if multiple provided + + return self + + @overload + def add(self, condition: OnContextCondition) -> "Handoffs": ... + + @overload + def add(self, condition: OnCondition) -> "Handoffs": ... + + def add(self, condition: Union[OnContextCondition, OnCondition]) -> "Handoffs": + """ + Add a single condition (OnContextCondition or OnCondition). + + Args: + condition: The condition to add (OnContextCondition or OnCondition) + + Raises: + TypeError: If the condition type is not supported + + Returns: + Self for method chaining + """ + # This add method is a helper method designed to make it easier for + # adding handoffs without worrying about the specific type. + if isinstance(condition, OnContextCondition): + return self.add_context_condition(condition) + elif isinstance(condition, OnCondition): + return self.add_llm_condition(condition) + else: + raise TypeError(f"Unsupported condition type: {type(condition).__name__}") + + def add_many(self, conditions: list[Union[OnContextCondition, OnCondition]]) -> "Handoffs": + """ + Add multiple conditions of any supported types (OnContextCondition and OnCondition). 
+ + Args: + conditions: List of conditions to add + + Raises: + TypeError: If an unsupported condition type is provided + + Returns: + Self for method chaining + """ + # This add_many method is a helper method designed to make it easier for + # adding handoffs without worrying about the specific type. + context_conditions = [] + llm_conditions = [] + + for condition in conditions: + if isinstance(condition, OnContextCondition): + context_conditions.append(condition) + elif isinstance(condition, OnCondition): + llm_conditions.append(condition) + else: + raise TypeError(f"Unsupported condition type: {type(condition).__name__}") + + if context_conditions: + self.add_context_conditions(context_conditions) + if llm_conditions: + self.add_llm_conditions(llm_conditions) + + return self + + def clear(self) -> "Handoffs": + """ + Clear all handoff conditions. + + Returns: + Self for method chaining + """ + self.context_conditions.clear() + self.llm_conditions.clear() + self.after_works.clear() + return self + + def get_llm_conditions_by_target_type(self, target_type: type) -> list[OnCondition]: + """ + Get OnConditions for a specific target type. + + Args: + target_type: The type of condition to retrieve + + Returns: + List of conditions of the specified type, or None if none exist + """ + return [on_condition for on_condition in self.llm_conditions if on_condition.has_target_type(target_type)] + + def get_context_conditions_by_target_type(self, target_type: type) -> list[OnContextCondition]: + """ + Get OnContextConditions for a specific target type. + + Args: + target_type: The type of condition to retrieve + + Returns: + List of conditions of the specified type, or None if none exist + """ + return [ + on_context_condition + for on_context_condition in self.context_conditions + if on_context_condition.has_target_type(target_type) + ] + + def get_llm_conditions_requiring_wrapping(self) -> list[OnCondition]: + """ + Get LLM conditions that have targets that require wrapping. + + Returns: + List of LLM conditions that require wrapping + """ + return [condition for condition in self.llm_conditions if condition.target_requires_wrapping()] + + def get_context_conditions_requiring_wrapping(self) -> list[OnContextCondition]: + """ + Get context conditions that have targets that require wrapping. + + Returns: + List of context conditions that require wrapping + """ + return [condition for condition in self.context_conditions if condition.target_requires_wrapping()] + + def set_llm_function_names(self) -> None: + """ + Set the LLM function names for all LLM conditions, creating unique names for each function. 
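+
+ For example (illustrative), the first OnCondition targeting an agent named
+ "billing" would receive a function name such as "transfer_to_billing_1".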
+ """ + for i, condition in enumerate(self.llm_conditions): + # Function names are made unique and allow multiple OnCondition's to the same agent + condition.llm_function_name = f"transfer_to_{condition.target.normalized_name()}_{i + 1}" diff --git a/mm_agents/coact/autogen/agentchat/group/llm_condition.py b/mm_agents/coact/autogen/agentchat/group/llm_condition.py new file mode 100644 index 0000000..8bc13fe --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/llm_condition.py @@ -0,0 +1,93 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import TYPE_CHECKING, Any + +from pydantic import BaseModel + +from .context_str import ContextStr + +if TYPE_CHECKING: + # Avoid circular import + from ..conversable_agent import ConversableAgent + +__all__ = ["ContextStrLLMCondition", "LLMCondition", "StringLLMCondition"] + + +class LLMCondition(BaseModel): + """Protocol for conditions evaluated by an LLM.""" + + def get_prompt(self, agent: "ConversableAgent", messages: list[dict[str, Any]]) -> str: + """Get the prompt text for LLM evaluation. + + Args: + agent: The agent evaluating the condition + messages: The conversation history + + Returns: + The prompt text to be evaluated by the LLM + """ + raise NotImplementedError("Requires subclasses to implement.") + + +class StringLLMCondition(LLMCondition): + """Simple string-based LLM condition. + + This condition provides a static string prompt to be evaluated by an LLM. + """ + + prompt: str + + def __init__(self, prompt: str, **data: Any) -> None: + """Initialize with a prompt string as a positional parameter. + + Args: + prompt: The static prompt string to evaluate + data: Additional data for the parent class + """ + super().__init__(prompt=prompt, **data) + + def get_prompt(self, agent: "ConversableAgent", messages: list[dict[str, Any]]) -> str: + """Return the static prompt string. + + Args: + agent: The agent evaluating the condition (not used) + messages: The conversation history (not used) + + Returns: + The static prompt string + """ + return self.prompt + + +class ContextStrLLMCondition(LLMCondition): + """Context variable-based LLM condition. + + This condition uses a ContextStr object with context variable placeholders that + will be substituted before being evaluated by an LLM. + """ + + context_str: ContextStr + + def __init__(self, context_str: ContextStr, **data: Any) -> None: + """Initialize with a context string as a positional parameter. + + Args: + context_str: The ContextStr object with variable placeholders + data: Additional data for the parent class + """ + super().__init__(context_str=context_str, **data) + + def get_prompt(self, agent: "ConversableAgent", messages: list[dict[str, Any]]) -> str: + """Return the prompt with context variables substituted. 
+ + Args: + agent: The agent evaluating the condition (provides context variables) + messages: The conversation history (not used) + + Returns: + The prompt with context variables substituted + """ + result = self.context_str.format(agent.context_variables) + return result if result is not None else "" diff --git a/mm_agents/coact/autogen/agentchat/group/multi_agent_chat.py b/mm_agents/coact/autogen/agentchat/group/multi_agent_chat.py new file mode 100644 index 0000000..7e0a91c --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/multi_agent_chat.py @@ -0,0 +1,237 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +import asyncio +import threading +from typing import TYPE_CHECKING, Any, Union + +from ...doc_utils import export_module +from ...events.agent_events import ErrorEvent, RunCompletionEvent +from ...io.base import IOStream +from ...io.run_response import AsyncRunResponse, AsyncRunResponseProtocol, RunResponse, RunResponseProtocol +from ...io.thread_io_stream import AsyncThreadIOStream, ThreadIOStream +from ..chat import ChatResult +from .context_variables import ContextVariables +from .group_utils import cleanup_temp_user_messages + +if TYPE_CHECKING: + from ..agent import Agent + from .patterns.pattern import Pattern + +__all__ = [ + "a_initiate_group_chat", + "a_run_group_chat", + "initiate_group_chat", + "run_group_chat", +] + + +@export_module("autogen") +def initiate_group_chat( + pattern: "Pattern", + messages: Union[list[dict[str, Any]], str], + max_rounds: int = 20, +) -> tuple[ChatResult, ContextVariables, "Agent"]: + """Initialize and run a group chat using a pattern for configuration. + + Args: + pattern: Pattern object that encapsulates the chat configuration. + messages: Initial message(s). + max_rounds: Maximum number of conversation rounds. + + Returns: + ChatResult: Conversations chat history. + ContextVariables: Updated Context variables. + "ConversableAgent": Last speaker. + """ + # Let the pattern prepare the group chat and all its components + # Only passing the necessary parameters that aren't already in the pattern + ( + _, # agents, + _, # wrapped_agents, + _, # user_agent, + context_variables, + _, # initial_agent, + _, # group_after_work, + _, # tool_execution, + _, # groupchat, + manager, + processed_messages, + last_agent, + _, # group_agent_names, + _, # temp_user_list, + ) = pattern.prepare_group_chat( + max_rounds=max_rounds, + messages=messages, + ) + + # Start or resume the conversation + if len(processed_messages) > 1: + last_agent, last_message = manager.resume(messages=processed_messages) + clear_history = False + else: + last_message = processed_messages[0] + clear_history = True + + if last_agent is None: + raise ValueError("No agent selected to start the conversation") + + chat_result = last_agent.initiate_chat( + manager, + message=last_message, + clear_history=clear_history, + summary_method=pattern.summary_method, + ) + + cleanup_temp_user_messages(chat_result) + + return chat_result, context_variables, manager.last_speaker + + +@export_module("autogen.agentchat") +async def a_initiate_group_chat( + pattern: "Pattern", + messages: Union[list[dict[str, Any]], str], + max_rounds: int = 20, +) -> tuple[ChatResult, ContextVariables, "Agent"]: + """Initialize and run a group chat using a pattern for configuration, asynchronously. + + Args: + pattern: Pattern object that encapsulates the chat configuration. + messages: Initial message(s). 
+ max_rounds: Maximum number of conversation rounds. + + Returns: + ChatResult: Conversations chat history. + ContextVariables: Updated Context variables. + "ConversableAgent": Last speaker. + """ + # Let the pattern prepare the group chat and all its components + # Only passing the necessary parameters that aren't already in the pattern + ( + _, # agents, + _, # wrapped_agents, + _, # user_agent, + context_variables, + _, # initial_agent, + _, # group_after_work, + _, # tool_execution, + _, # groupchat, + manager, + processed_messages, + last_agent, + _, # group_agent_names, + _, # temp_user_list, + ) = pattern.prepare_group_chat( + max_rounds=max_rounds, + messages=messages, + ) + + # Start or resume the conversation + if len(processed_messages) > 1: + last_agent, last_message = await manager.a_resume(messages=processed_messages) + clear_history = False + else: + last_message = processed_messages[0] + clear_history = True + + if last_agent is None: + raise ValueError("No agent selected to start the conversation") + + chat_result = await last_agent.a_initiate_chat( + manager, + message=last_message, # type: ignore[arg-type] + clear_history=clear_history, + summary_method=pattern.summary_method, + ) + + cleanup_temp_user_messages(chat_result) + + return chat_result, context_variables, manager.last_speaker + + +@export_module("autogen.agentchat") +def run_group_chat( + pattern: "Pattern", + messages: Union[list[dict[str, Any]], str], + max_rounds: int = 20, +) -> RunResponseProtocol: + iostream = ThreadIOStream() + # todo: add agents + response = RunResponse(iostream, agents=[]) + + def _initiate_group_chat( + pattern: "Pattern" = pattern, + messages: Union[list[dict[str, Any]], str] = messages, + max_rounds: int = max_rounds, + iostream: ThreadIOStream = iostream, + response: RunResponse = response, + ) -> None: + with IOStream.set_default(iostream): + try: + chat_result, context_vars, agent = initiate_group_chat( + pattern=pattern, + messages=messages, + max_rounds=max_rounds, + ) + + IOStream.get_default().send( + RunCompletionEvent( # type: ignore[call-arg] + history=chat_result.chat_history, + summary=chat_result.summary, + cost=chat_result.cost, + last_speaker=agent.name, + context_variables=context_vars, + ) + ) + except Exception as e: + response.iostream.send(ErrorEvent(error=e)) # type: ignore[call-arg] + + threading.Thread( + target=_initiate_group_chat, + ).start() + + return response + + +@export_module("autogen.agentchat") +async def a_run_group_chat( + pattern: "Pattern", + messages: Union[list[dict[str, Any]], str], + max_rounds: int = 20, +) -> AsyncRunResponseProtocol: + iostream = AsyncThreadIOStream() + # todo: add agents + response = AsyncRunResponse(iostream, agents=[]) + + async def _initiate_group_chat( + pattern: "Pattern" = pattern, + messages: Union[list[dict[str, Any]], str] = messages, + max_rounds: int = max_rounds, + iostream: AsyncThreadIOStream = iostream, + response: AsyncRunResponse = response, + ) -> None: + with IOStream.set_default(iostream): + try: + chat_result, context_vars, agent = await a_initiate_group_chat( + pattern=pattern, + messages=messages, + max_rounds=max_rounds, + ) + + IOStream.get_default().send( + RunCompletionEvent( # type: ignore[call-arg] + history=chat_result.chat_history, + summary=chat_result.summary, + cost=chat_result.cost, + last_speaker=agent.name, + context_variables=context_vars, + ) + ) + except Exception as e: + response.iostream.send(ErrorEvent(error=e)) # type: ignore[call-arg] + + 
asyncio.create_task(_initiate_group_chat()) + + return response diff --git a/mm_agents/coact/autogen/agentchat/group/on_condition.py b/mm_agents/coact/autogen/agentchat/group/on_condition.py new file mode 100644 index 0000000..8360dc0 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/on_condition.py @@ -0,0 +1,58 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import Optional + +from pydantic import BaseModel + +from ...doc_utils import export_module +from .available_condition import AvailableCondition +from .llm_condition import LLMCondition +from .targets.transition_target import TransitionTarget + +__all__ = [ + "OnCondition", +] + + +@export_module("autogen") +class OnCondition(BaseModel): # noqa: N801 + """Defines a condition for transitioning to another agent or nested chats. + + This is for LLM-based condition evaluation where these conditions are translated into tools and attached to the agent. + + These are evaluated after the OnCondition conditions but before the after work condition. + + Args: + target (TransitionTarget): The transition (essentially an agent) to hand off to. + condition (LLMCondition): The condition for transitioning to the target agent, evaluated by the LLM. + available (AvailableCondition): Optional condition to determine if this OnCondition is included for the LLM to evaluate based on context variables using classes like StringAvailableCondition and ContextExpressionAvailableCondition. + llm_function_name (Optional[str]): The name of the LLM function to use for this condition. + """ + + target: TransitionTarget + condition: LLMCondition + available: Optional[AvailableCondition] = None + llm_function_name: Optional[str] = None + + def has_target_type(self, target_type: type) -> bool: + """ + Check if the target type matches the specified type. + + Args: + target_type (type): The target type to check against, which should be a subclass of TransitionTarget + + Returns: + bool: True if the target type matches, False otherwise + """ + return isinstance(self.target, target_type) + + def target_requires_wrapping(self) -> bool: + """ + Check if the target requires wrapping in an agent. + + Returns: + bool: True if the target requires wrapping, False otherwise + """ + return self.target.needs_agent_wrapper() diff --git a/mm_agents/coact/autogen/agentchat/group/on_context_condition.py b/mm_agents/coact/autogen/agentchat/group/on_context_condition.py new file mode 100644 index 0000000..013f1c1 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/on_context_condition.py @@ -0,0 +1,54 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import Optional + +from pydantic import BaseModel + +from .available_condition import AvailableCondition +from .context_condition import ContextCondition +from .targets.transition_target import TransitionTarget + +__all__ = [ + "OnContextCondition", +] + + +class OnContextCondition(BaseModel): # noqa: N801 + """Defines a condition for transitioning to another agent or nested chats using context variables and the ContextExpression class. + + This is for context variable-based condition evaluation (does not use the agent's LLM). + + These are evaluated before the OnCondition and after work conditions. + + Args: + target (TransitionTarget): The transition (essentially an agent) to hand off to. 
+ condition (Optional[ContextCondition]): The context variable based condition for transitioning to the target agent. If None, the condition always evaluates to True. + available (AvailableCondition): Optional condition to determine if this OnCondition is included for the LLM to evaluate based on context variables using classes like StringAvailableCondition and ContextExpressionAvailableCondition. + """ + + target: TransitionTarget + condition: Optional[ContextCondition] = None + available: Optional[AvailableCondition] = None + + def has_target_type(self, target_type: type) -> bool: + """ + Check if the target type matches the specified type. + + Args: + target_type (type): The target type to check against. Should be a subclass of TransitionTarget. + + Returns: + bool: True if the target type matches, False otherwise + """ + return isinstance(self.target, target_type) + + def target_requires_wrapping(self) -> bool: + """ + Check if the target requires wrapping in an agent. + + Returns: + bool: True if the target requires wrapping, False otherwise + """ + return self.target.needs_agent_wrapper() diff --git a/mm_agents/coact/autogen/agentchat/group/patterns/__init__.py b/mm_agents/coact/autogen/agentchat/group/patterns/__init__.py new file mode 100644 index 0000000..a26451c --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/patterns/__init__.py @@ -0,0 +1,18 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# + +from .auto import AutoPattern +from .manual import ManualPattern +from .pattern import DefaultPattern +from .random import RandomPattern +from .round_robin import RoundRobinPattern + +__all__ = [ + "AutoPattern", + "DefaultPattern", + "ManualPattern", + "RandomPattern", + "RoundRobinPattern", +] diff --git a/mm_agents/coact/autogen/agentchat/group/patterns/auto.py b/mm_agents/coact/autogen/agentchat/group/patterns/auto.py new file mode 100644 index 0000000..f4a1d71 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/patterns/auto.py @@ -0,0 +1,159 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import TYPE_CHECKING, Any, Callable, Optional, Tuple, Union + +from ..context_variables import ContextVariables +from ..targets.group_manager_target import GroupManagerSelectionMessage, GroupManagerTarget +from ..targets.transition_target import TransitionTarget +from .pattern import Pattern + +if TYPE_CHECKING: + from ...conversable_agent import ConversableAgent + from ...groupchat import GroupChat, GroupChatManager + from ..group_tool_executor import GroupToolExecutor + + +class AutoPattern(Pattern): + """AutoPattern implements a flexible pattern where agents are selected based on their expertise. + + In this pattern, a group manager automatically selects the next agent to speak based on the context + of the conversation and agent descriptions. The after_work is always set to "group_manager" as + this is the defining characteristic of this pattern. 
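+
+ Example (illustrative sketch, assuming AutoPattern, initiate_group_chat and
+ ConversableAgent are imported from this package; the agent names and
+ llm_config below are placeholders, not part of this patch):
+
+ triage = ConversableAgent(name="triage", llm_config=llm_config)
+ tech = ConversableAgent(name="tech_support", llm_config=llm_config)
+
+ pattern = AutoPattern(
+ initial_agent=triage,
+ agents=[triage, tech],
+ group_manager_args={"llm_config": llm_config},
+ )
+ chat_result, context_variables, last_speaker = initiate_group_chat(
+ pattern=pattern,
+ messages="My laptop will not boot",
+ max_rounds=20,
+ )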
+ """ + + def __init__( + self, + initial_agent: "ConversableAgent", + agents: list["ConversableAgent"], + user_agent: Optional["ConversableAgent"] = None, + group_manager_args: Optional[dict[str, Any]] = None, + context_variables: Optional[ContextVariables] = None, + selection_message: Optional[GroupManagerSelectionMessage] = None, + exclude_transit_message: bool = True, + summary_method: Optional[Union[str, Callable[..., Any]]] = "last_msg", + ): + """Initialize the AutoPattern. + + The after_work is always set to group_manager selection, which is the defining + characteristic of this pattern. You can customize the selection message used + by the group manager when selecting the next agent. + + Args: + initial_agent: The first agent to speak in the group chat. + agents: List of all agents participating in the chat. + user_agent: Optional user proxy agent. + group_manager_args: Optional arguments for the GroupChatManager. + context_variables: Initial context variables for the chat. + selection_message: Custom message to use when the group manager is selecting agents. + exclude_transit_message: Whether to exclude transit messages from the conversation. + summary_method: Method for summarizing the conversation. + """ + # Create the group_manager after_work with the provided selection message + group_manager_after_work = GroupManagerTarget(selection_message=selection_message) + + super().__init__( + initial_agent=initial_agent, + agents=agents, + user_agent=user_agent, + group_manager_args=group_manager_args, + context_variables=context_variables, + group_after_work=group_manager_after_work, + exclude_transit_message=exclude_transit_message, + summary_method=summary_method, + ) + + # Store the selection message for potential use + self.selection_message = selection_message + + def prepare_group_chat( + self, + max_rounds: int, + messages: Union[list[dict[str, Any]], str], + ) -> Tuple[ + list["ConversableAgent"], + list["ConversableAgent"], + Optional["ConversableAgent"], + ContextVariables, + "ConversableAgent", + TransitionTarget, + "GroupToolExecutor", + "GroupChat", + "GroupChatManager", + list[dict[str, Any]], + Any, + list[str], + list[Any], + ]: + """Prepare the group chat for organic agent selection. + + Ensures that: + 1. The group manager has a valid LLM config + 2. All agents have appropriate descriptions for the group manager to use + + Args: + max_rounds: Maximum number of conversation rounds. + messages: Initial message(s) to start the conversation. + + Returns: + Tuple containing all necessary components for the group chat. 
+ """ + # Validate that group_manager_args has an LLM config which is required for this pattern + if not self.group_manager_args.get("llm_config", False): + # Check if any agent has an LLM config we can use + has_llm_config = any(getattr(agent, "llm_config", False) for agent in self.agents) + + if not has_llm_config: + raise ValueError( + "AutoPattern requires the group_manager_args to include an llm_config, " + "or at least one agent to have an llm_config" + ) + + # Check that all agents have descriptions for effective group manager selection + for agent in self.agents: + if not hasattr(agent, "description") or not agent.description: + agent.description = f"Agent {agent.name}" + + # Use the parent class's implementation to prepare the agents and group chat + components = super().prepare_group_chat( + max_rounds=max_rounds, + messages=messages, + ) + + # Extract the group_after_work and the rest of the components + ( + agents, + wrapped_agents, + user_agent, + context_variables, + initial_agent, + _, + tool_executor, + groupchat, + manager, + processed_messages, + last_agent, + group_agent_names, + temp_user_list, + ) = components + + # Ensure we're using the group_manager after_work + group_after_work = self.group_after_work + + # Return all components with our group_after_work + return ( + agents, + wrapped_agents, + user_agent, + context_variables, + initial_agent, + group_after_work, + tool_executor, + groupchat, + manager, + processed_messages, + last_agent, + group_agent_names, + temp_user_list, + ) diff --git a/mm_agents/coact/autogen/agentchat/group/patterns/manual.py b/mm_agents/coact/autogen/agentchat/group/patterns/manual.py new file mode 100644 index 0000000..3d9c90c --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/patterns/manual.py @@ -0,0 +1,176 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import TYPE_CHECKING, Any, Callable, Optional, Tuple, Union + +from ..context_variables import ContextVariables +from ..group_tool_executor import GroupToolExecutor +from ..targets.transition_target import AskUserTarget, TransitionTarget +from .pattern import Pattern + +if TYPE_CHECKING: + from ...conversable_agent import ConversableAgent + from ...groupchat import GroupChat, GroupChatManager + + +class ManualPattern(Pattern): + """ManualPattern will ask the user to nominate the next agent to speak at each turn.""" + + def __init__( + self, + initial_agent: "ConversableAgent", + agents: list["ConversableAgent"], + user_agent: Optional["ConversableAgent"] = None, + group_manager_args: Optional[dict[str, Any]] = None, + context_variables: Optional[ContextVariables] = None, + exclude_transit_message: bool = True, + summary_method: Optional[Union[str, Callable[..., Any]]] = "last_msg", + ): + """Initialize the ManualPattern. + + The after_work is always set to ask_user, which will prompt the user for the next agent + + Args: + initial_agent: The first agent to speak in the group chat. + agents: List of all agents participating in the chat. + user_agent: Optional user proxy agent. + group_manager_args: Optional arguments for the GroupChatManager. + context_variables: Initial context variables for the chat. + exclude_transit_message: Whether to exclude transit messages from the conversation. + summary_method: Method for summarizing the conversation. 
+ """ + # The group after work will be to ask the user + group_after_work = AskUserTarget() + + super().__init__( + initial_agent=initial_agent, + agents=agents, + user_agent=user_agent, + group_manager_args=group_manager_args, + context_variables=context_variables, + group_after_work=group_after_work, + exclude_transit_message=exclude_transit_message, + summary_method=summary_method, + ) + + def prepare_group_chat( + self, + max_rounds: int, + messages: Union[list[dict[str, Any]], str], + ) -> Tuple[ + list["ConversableAgent"], + list["ConversableAgent"], + Optional["ConversableAgent"], + ContextVariables, + "ConversableAgent", + TransitionTarget, + "GroupToolExecutor", + "GroupChat", + "GroupChatManager", + list[dict[str, Any]], + Any, + list[str], + list[Any], + ]: + """Prepare the group chat for organic agent selection. + + Ensures that: + 1. The group manager has a valid LLM config + 2. All agents have appropriate descriptions for the group manager to use + + Args: + max_rounds: Maximum number of conversation rounds. + messages: Initial message(s) to start the conversation. + + Returns: + Tuple containing all necessary components for the group chat. + """ + # Use the parent class's implementation to prepare the agents and group chat + components = super().prepare_group_chat( + max_rounds=max_rounds, + messages=messages, + ) + + # Extract the group_after_work and the rest of the components + ( + agents, + wrapped_agents, + user_agent, + context_variables, + initial_agent, + _, + tool_executor, + groupchat, + manager, + processed_messages, + last_agent, + group_agent_names, + temp_user_list, + ) = components + + # Ensure we're using the group_manager after_work + group_after_work = self.group_after_work + + # Set up the allowed speaker transitions to exclude user_agent and GroupToolExecutor + self._setup_allowed_transitions(groupchat, user_agent, tool_executor) + + # Return all components with our group_after_work + return ( + agents, + wrapped_agents, + user_agent, + context_variables, + initial_agent, + group_after_work, + tool_executor, + groupchat, + manager, + processed_messages, + last_agent, + group_agent_names, + temp_user_list, + ) + + def _setup_allowed_transitions( + self, groupchat: "GroupChat", user_agent: Optional["ConversableAgent"], tool_executor: "GroupToolExecutor" + ) -> None: + """Set up the allowed speaker transitions for the group chat so that when a user selects the next agent the tool executor and user agent don't appear as options. + + Creates transitions where: + 1. Any agent can speak after any other agent, including themselves + 2. The user_agent and GroupToolExecutor are excluded from transitions + + Args: + groupchat: The GroupChat instance to configure + user_agent: The user agent to exclude from transitions + tool_executor: The GroupToolExecutor to exclude from transitions + """ + # NOTE: THIS IS NOT WORKING - THE TRANSITIONS ARE NOT BEING KEPT?! 
+ """ + # Get all agents in the group chat + all_agents = groupchat.agents + + # Filter out user_agent and group tool executor + eligible_agents = [] + for agent in all_agents: + # Skip user_agent + if agent == user_agent: + continue + + # Skip GroupToolExecutor + if isinstance(agent, GroupToolExecutor): + continue + + eligible_agents.append(agent) + + # Create a fully connected graph among eligible agents + # Each agent can be followed by any other eligible agent + allowed_transitions = {} + for agent in eligible_agents: + # For each agent, every other eligible agent can follow + allowed_transitions[agent] = eligible_agents + + # Set the transitions in the group chat + groupchat.allowed_speaker_transitions_dict = allowed_transitions + """ diff --git a/mm_agents/coact/autogen/agentchat/group/patterns/pattern.py b/mm_agents/coact/autogen/agentchat/group/patterns/pattern.py new file mode 100644 index 0000000..6c0d748 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/patterns/pattern.py @@ -0,0 +1,294 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +# Patterns of agent orchestrations +# Uses the group chat or the agents' handoffs to create a pattern + +from abc import ABC, abstractmethod +from typing import TYPE_CHECKING, Any, Callable, Optional, Tuple, Union + +from ..context_variables import ContextVariables +from ..group_utils import ( + create_group_manager, + create_group_transition, + link_agents_to_group_manager, + prepare_group_agents, + process_initial_messages, + setup_context_variables, +) +from ..targets.transition_target import TerminateTarget, TransitionTarget + +if TYPE_CHECKING: + from ...agent import Agent + from ...conversable_agent import ConversableAgent + from ...groupchat import GroupChat, GroupChatManager + from ..group_tool_executor import GroupToolExecutor + + +class Pattern(ABC): + """Base abstract class for all orchestration patterns. + + Patterns provide a reusable way to define how agents interact within a group chat. + Each pattern encapsulates the logic for setting up agents, configuring handoffs, + and determining the flow of conversation. + + This is an abstract base class and should not be instantiated directly. + Use one of the concrete pattern implementations like AutoPattern, + RoundRobinPattern, RandomPattern, or ManualPattern. + """ + + def __init__( + self, + initial_agent: "ConversableAgent", + agents: list["ConversableAgent"], + user_agent: Optional["ConversableAgent"] = None, + group_manager_args: Optional[dict[str, Any]] = None, + context_variables: Optional[ContextVariables] = None, + group_after_work: Optional[TransitionTarget] = None, + exclude_transit_message: bool = True, + summary_method: Optional[Union[str, Callable[..., Any]]] = "last_msg", + ): + """Initialize the pattern with the required components. + + Args: + initial_agent: The first agent to speak in the group chat. + agents: List of all agents participating in the chat. + user_agent: Optional user proxy agent. + group_manager_args: Optional arguments for the GroupChatManager. + context_variables: Initial context variables for the chat. + group_after_work: Default after work transition behavior when no specific next agent is determined. + exclude_transit_message: Whether to exclude transit messages from the conversation. + summary_method: Method for summarizing the conversation. 
+ """ + self.initial_agent = initial_agent + self.agents = agents + self.user_agent = user_agent + self.group_manager_args = group_manager_args or {} + self.context_variables = context_variables or ContextVariables() + self.group_after_work = group_after_work if group_after_work is not None else TerminateTarget() + self.exclude_transit_message = exclude_transit_message + self.summary_method = summary_method + + @abstractmethod + def prepare_group_chat( + self, + max_rounds: int, + messages: Union[list[dict[str, Any]], str], + ) -> Tuple[ + list["ConversableAgent"], + list["ConversableAgent"], + Optional["ConversableAgent"], + ContextVariables, + "ConversableAgent", + TransitionTarget, + "GroupToolExecutor", + "GroupChat", + "GroupChatManager", + list[dict[str, Any]], + "ConversableAgent", + list[str], + list["Agent"], + ]: + """Prepare the group chat for orchestration. + + This is the main method called by initiate_group_chat to set up the pattern. + Subclasses must implement or extend this method to define pattern-specific behavior. + + Args: + max_rounds: Maximum number of conversation rounds. + messages: Initial message(s) to start the conversation. + + Returns: + Tuple containing: + - List of agents involved in the group chat + - List of wrapped agents + - User agent, if applicable + - Context variables for the group chat + - Initial agent for the group chat + - Group-level after work transition for the group chat + - Tool executor for the group chat + - GroupChat instance + - GroupChatManager instance + - Processed messages + - Last agent to speak + - List of group agent names + - List of temporary user agents + """ + from ...groupchat import GroupChat + + # Prepare the agents using the existing helper function + tool_executor, wrapped_agents = prepare_group_agents( + self.agents, self.context_variables, self.exclude_transit_message + ) + + # Process the initial messages BEFORE creating the GroupChat + # This will create a temporary user agent if needed + processed_messages, last_agent, group_agent_names, temp_user_list = process_initial_messages( + messages, self.user_agent, self.agents, wrapped_agents + ) + + # Create transition function (has enclosed state for initial agent) + group_transition = create_group_transition( + initial_agent=self.initial_agent, + tool_execution=tool_executor, + group_agent_names=group_agent_names, + user_agent=self.user_agent, + group_after_work=self.group_after_work, + ) + + # Create the group chat - now we use temp_user_list if no user_agent + groupchat = GroupChat( + agents=[tool_executor] + + self.agents + + wrapped_agents + + ([self.user_agent] if self.user_agent else temp_user_list), + messages=[], + max_round=max_rounds, + speaker_selection_method=group_transition, + ) + + # Create the group manager + manager = create_group_manager(groupchat, self.group_manager_args, self.agents, self.group_after_work) + + # Point all agent's context variables to this function's context_variables + setup_context_variables( + tool_execution=tool_executor, + agents=self.agents, + manager=manager, + user_agent=self.user_agent, + context_variables=self.context_variables, + ) + + # Link all agents with the GroupChatManager to allow access to the group chat + link_agents_to_group_manager(groupchat.agents, manager) + + return ( + self.agents, + wrapped_agents, + self.user_agent, + self.context_variables, + self.initial_agent, + self.group_after_work, + tool_executor, + groupchat, + manager, + processed_messages, + last_agent, + group_agent_names, + temp_user_list, + ) # 
type: ignore[return-value] + + @classmethod + def create_default( + cls, + initial_agent: "ConversableAgent", + agents: list["ConversableAgent"], + user_agent: Optional["ConversableAgent"] = None, + group_manager_args: Optional[dict[str, Any]] = None, + context_variables: Optional[ContextVariables] = None, + exclude_transit_message: bool = True, + summary_method: Optional[Union[str, Callable[..., Any]]] = "last_msg", + ) -> "DefaultPattern": + """Create a default pattern with minimal configuration. + + This replaces the need for a separate BasePattern class by providing + a factory method that creates a simple DefaultPattern instance. + + Args: + initial_agent: The first agent to speak in the group chat. + agents: List of all agents participating in the chat. + user_agent: Optional user proxy agent. + group_manager_args: Optional arguments for the GroupChatManager. + context_variables: Initial context variables for the chat. + exclude_transit_message: Whether to exclude transit messages from the conversation. + summary_method: Method for summarizing the conversation. + + Returns: + A DefaultPattern instance with basic configuration. + """ + return DefaultPattern( + initial_agent=initial_agent, + agents=agents, + user_agent=user_agent, + group_manager_args=group_manager_args, + context_variables=context_variables, + exclude_transit_message=exclude_transit_message, + summary_method=summary_method, + ) + + +class DefaultPattern(Pattern): + """DefaultPattern implements a minimal pattern for simple agent interactions. + + This replaces the previous BasePattern and provides a concrete implementation + of the Pattern abstract base class. + """ + + def prepare_group_chat( + self, + max_rounds: int, + messages: Union[list[dict[str, Any]], str], + ) -> Tuple[ + list["ConversableAgent"], + list["ConversableAgent"], + Optional["ConversableAgent"], + ContextVariables, + "ConversableAgent", + TransitionTarget, + "GroupToolExecutor", + "GroupChat", + "GroupChatManager", + list[dict[str, Any]], + Any, + list[str], + list[Any], + ]: + """Prepare the group chat with default configuration. + + This implementation calls the parent class method but ensures that + the group_after_work in the returned tuple is the pattern's own. + + Args: + max_rounds: Maximum number of conversation rounds. + messages: Initial message(s) to start the conversation. + + Returns: + Tuple containing all necessary components for the group chat. 
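The `create_default` factory and `DefaultPattern` illustrate the intended extension point: delegate to `Pattern.prepare_group_chat` and substitute your own after-work target in the returned 13-tuple. A minimal, hypothetical subclass along the same lines (import paths assume this patch's vendored layout; it only makes sense when a user agent is supplied to the pattern):

```python
# Toy pattern: after every turn, control reverts to the user agent instead of
# terminating. It swaps element 5 (the group-level after-work target) of the
# tuple returned by the base class, as documented in the Returns section above.
from typing import Any, Union

from mm_agents.coact.autogen.agentchat.group.patterns.pattern import Pattern
from mm_agents.coact.autogen.agentchat.group.targets.transition_target import RevertToUserTarget


class RevertToUserPattern(Pattern):
    def prepare_group_chat(self, max_rounds: int, messages: Union[list[dict[str, Any]], str]):
        components = super().prepare_group_chat(max_rounds=max_rounds, messages=messages)
        # Index 5 is group_after_work in the 13-element tuple.
        return components[:5] + (RevertToUserTarget(),) + components[6:]
```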
+ """ + # Use the parent class's implementation to prepare the agents and group chat + ( + agents, + wrapped_agents, + user_agent, + context_variables, + initial_agent, + _, # Ignore the group_after_work from parent + tool_executor, + groupchat, + manager, + processed_messages, + last_agent, + group_agent_names, + temp_user_list, + ) = super().prepare_group_chat( + max_rounds=max_rounds, + messages=messages, + ) + + # Return all components with our group_after_work + return ( + agents, + wrapped_agents, + user_agent, + context_variables, + initial_agent, + self.group_after_work, # Use our own group_after_work + tool_executor, + groupchat, + manager, + processed_messages, + last_agent, + group_agent_names, + temp_user_list, + ) diff --git a/mm_agents/coact/autogen/agentchat/group/patterns/random.py b/mm_agents/coact/autogen/agentchat/group/patterns/random.py new file mode 100644 index 0000000..24138ed --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/patterns/random.py @@ -0,0 +1,106 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import TYPE_CHECKING, Any, Optional, Tuple, Union + +from ..context_variables import ContextVariables +from ..targets.transition_target import RandomAgentTarget, TransitionTarget +from .pattern import Pattern + +if TYPE_CHECKING: + from ...conversable_agent import ConversableAgent + from ...groupchat import GroupChat, GroupChatManager + from ..group_tool_executor import GroupToolExecutor + + +class RandomPattern(Pattern): + """RandomPattern implements a random agent selection process.""" + + def _generate_handoffs( + self, + initial_agent: "ConversableAgent", + agents: list["ConversableAgent"], + user_agent: Optional["ConversableAgent"], + ) -> None: + """Generate handoffs between agents in a random fashion.""" + agent_list = agents + ([user_agent] if user_agent is not None else []) + + for agent in agent_list: + # Get the list of agents except itself + other_agents = [a for a in agent_list if a != agent] + + # Create a random after work + agent.handoffs.set_after_work(target=RandomAgentTarget(agents=other_agents)) + + def prepare_group_chat( + self, + max_rounds: int, + messages: Union[list[dict[str, Any]], str], + ) -> Tuple[ + list["ConversableAgent"], + list["ConversableAgent"], + Optional["ConversableAgent"], + ContextVariables, + "ConversableAgent", + TransitionTarget, + "GroupToolExecutor", + "GroupChat", + "GroupChatManager", + list[dict[str, Any]], + Any, + list[str], + list[Any], + ]: + """Prepare the group chat for organic agent selection. + + Ensures that: + 1. The group manager has a valid LLM config + 2. All agents have appropriate descriptions for the group manager to use + + Args: + max_rounds: Maximum number of conversation rounds. + messages: Initial message(s) to start the conversation. + + Returns: + Tuple containing all necessary components for the group chat. 
+ """ + # Use the parent class's implementation to prepare the agents and group chat + ( + agents, + wrapped_agents, + user_agent, + context_variables, + initial_agent, + group_after_work, + tool_executor, + groupchat, + manager, + processed_messages, + last_agent, + group_agent_names, + temp_user_list, + ) = super().prepare_group_chat( + max_rounds=max_rounds, + messages=messages, + ) + + # Create the random handoffs between agents + self._generate_handoffs(initial_agent=initial_agent, agents=agents, user_agent=user_agent) + + # Return all components with our group_after_work + return ( + agents, + wrapped_agents, + user_agent, + context_variables, + initial_agent, + group_after_work, + tool_executor, + groupchat, + manager, + processed_messages, + last_agent, + group_agent_names, + temp_user_list, + ) diff --git a/mm_agents/coact/autogen/agentchat/group/patterns/round_robin.py b/mm_agents/coact/autogen/agentchat/group/patterns/round_robin.py new file mode 100644 index 0000000..9ecbaae --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/patterns/round_robin.py @@ -0,0 +1,117 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import TYPE_CHECKING, Any, Optional, Tuple, Union + +from ..context_variables import ContextVariables +from ..targets.transition_target import AgentTarget, TransitionTarget +from .pattern import Pattern + +if TYPE_CHECKING: + from ...conversable_agent import ConversableAgent + from ...groupchat import GroupChat, GroupChatManager + from ..group_tool_executor import GroupToolExecutor + + +class RoundRobinPattern(Pattern): + """RoundRobinPattern implements a round robin with handoffs between agents.""" + + def _generate_handoffs( + self, + initial_agent: "ConversableAgent", + agents: list["ConversableAgent"], + user_agent: Optional["ConversableAgent"], + ) -> None: + """Generate handoffs between agents in a round-robin fashion.""" + # Create a list of the agents and the user_agent but put the initial_agent first + agent_list = [initial_agent] + + # Add the rest of the agents, excluding the initial_agent and user_agent + for agent in agents: + if agent != initial_agent and (user_agent is None or agent != user_agent): + agent_list.append(agent) + + # Add the user_agent last if it exists + if user_agent is not None: + agent_list.append(user_agent) + + # Create handoffs in a round-robin fashion + for i, agent in enumerate(agent_list): + # Last agent hands off to the first agent + # Otherwise agent hands off to the next one + handoff_target = agent_list[0] if i == len(agent_list) - 1 else agent_list[i + 1] + + agent.handoffs.set_after_work(target=AgentTarget(agent=handoff_target)) + + def prepare_group_chat( + self, + max_rounds: int, + messages: Union[list[dict[str, Any]], str], + ) -> Tuple[ + list["ConversableAgent"], + list["ConversableAgent"], + Optional["ConversableAgent"], + ContextVariables, + "ConversableAgent", + TransitionTarget, + "GroupToolExecutor", + "GroupChat", + "GroupChatManager", + list[dict[str, Any]], + Any, + list[str], + list[Any], + ]: + """Prepare the group chat for organic agent selection. + + Ensures that: + 1. The group manager has a valid LLM config + 2. All agents have appropriate descriptions for the group manager to use + + Args: + max_rounds: Maximum number of conversation rounds. + messages: Initial message(s) to start the conversation. + + Returns: + Tuple containing all necessary components for the group chat. 
+ """ + # Use the parent class's implementation to prepare the agents and group chat + ( + agents, + wrapped_agents, + user_agent, + context_variables, + initial_agent, + group_after_work, + tool_executor, + groupchat, + manager, + processed_messages, + last_agent, + group_agent_names, + temp_user_list, + ) = super().prepare_group_chat( + max_rounds=max_rounds, + messages=messages, + ) + + # Create the handoffs between agents + self._generate_handoffs(initial_agent=initial_agent, agents=agents, user_agent=user_agent) + + # Return all components with our group_after_work + return ( + agents, + wrapped_agents, + user_agent, + context_variables, + initial_agent, + group_after_work, + tool_executor, + groupchat, + manager, + processed_messages, + last_agent, + group_agent_names, + temp_user_list, + ) diff --git a/mm_agents/coact/autogen/agentchat/group/reply_result.py b/mm_agents/coact/autogen/agentchat/group/reply_result.py new file mode 100644 index 0000000..7ee8e02 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/reply_result.py @@ -0,0 +1,26 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + + +__all__ = ["ReplyResult"] + + +from typing import Optional + +from pydantic import BaseModel + +from .context_variables import ContextVariables +from .targets.transition_target import TransitionTarget + + +class ReplyResult(BaseModel): + """Result of a tool call that is used to provide the return message and the target to transition to.""" + + message: str + target: Optional[TransitionTarget] = None + context_variables: Optional[ContextVariables] = None + + def __str__(self) -> str: + """The string representation for ReplyResult will be just the message.""" + return self.message diff --git a/mm_agents/coact/autogen/agentchat/group/speaker_selection_result.py b/mm_agents/coact/autogen/agentchat/group/speaker_selection_result.py new file mode 100644 index 0000000..9c8ba11 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/speaker_selection_result.py @@ -0,0 +1,41 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import TYPE_CHECKING, Optional, Union + +from pydantic import BaseModel + +from ..agent import Agent + +if TYPE_CHECKING: + # Avoid circular import + from ..groupchat import GroupChat + + +class SpeakerSelectionResult(BaseModel): + """Represents a speaker selection result that will be returned to GroupChat._prepare_and_select_agents to determine the next speaker. + + This class can return an Agent, a None to end the conversation, or a string for a speaker selection method. + """ + + terminate: Optional[bool] = None + agent_name: Optional[str] = None + speaker_selection_method: Optional[str] = None + + def get_speaker_selection_result(self, groupchat: "GroupChat") -> Optional[Union[Agent, str]]: + """Get the speaker selection result. If None, the conversation will end.""" + if self.agent_name is not None: + # Find the agent by name in the groupchat + for agent in groupchat.agents: + if agent.name == self.agent_name: + return agent + raise ValueError(f"Agent '{self.agent_name}' not found in groupchat.") + elif self.speaker_selection_method is not None: + return self.speaker_selection_method + elif self.terminate is not None and self.terminate: + return None + else: + raise ValueError( + "Unable to establish speaker selection result. 
No terminate, agent, or speaker selection method provided." + ) diff --git a/mm_agents/coact/autogen/agentchat/group/targets/__init__.py b/mm_agents/coact/autogen/agentchat/group/targets/__init__.py new file mode 100644 index 0000000..78d5382 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/targets/__init__.py @@ -0,0 +1,4 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# diff --git a/mm_agents/coact/autogen/agentchat/group/targets/group_chat_target.py b/mm_agents/coact/autogen/agentchat/group/targets/group_chat_target.py new file mode 100644 index 0000000..62ed046 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/targets/group_chat_target.py @@ -0,0 +1,132 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import TYPE_CHECKING, Any, Optional, Union + +from pydantic import BaseModel + +from ....doc_utils import export_module +from ...agent import Agent +from ..speaker_selection_result import SpeakerSelectionResult +from .transition_target import AgentTarget, TransitionTarget +from .transition_utils import __AGENT_WRAPPER_PREFIX__ + +if TYPE_CHECKING: + from ...conversable_agent import ConversableAgent + from ...groupchat import GroupChat + from ..patterns.pattern import Pattern + + +__all__ = ["GroupChatConfig", "GroupChatTarget"] + + +@export_module("autogen.agentchat.group") +class GroupChatConfig(BaseModel): + """Configuration for a group chat transition target. + + Note: If context_variables are not passed in, the outer context variables will be passed in""" + + pattern: "Pattern" + messages: Union[list[dict[str, Any]], str] + max_rounds: int = 20 + + +@export_module("autogen.agentchat.group") +class GroupChatTarget(TransitionTarget): + """Target that represents a group chat.""" + + group_chat_config: GroupChatConfig + + def can_resolve_for_speaker_selection(self) -> bool: + """Check if the target can resolve for speaker selection. For GroupChatTarget the chat must be encapsulated into an agent.""" + return False + + def resolve( + self, + groupchat: "GroupChat", + current_agent: "ConversableAgent", + user_agent: Optional["ConversableAgent"], + ) -> SpeakerSelectionResult: + """Resolve to the nested chat configuration.""" + raise NotImplementedError( + "GroupChatTarget does not support the resolve method. An agent should be used to encapsulate this nested chat and then the target changed to an AgentTarget." + ) + + def display_name(self) -> str: + """Get the display name for the target.""" + return "a group chat" + + def normalized_name(self) -> str: + """Get a normalized name for the target that has no spaces, used for function calling.""" + return "group_chat" + + def __str__(self) -> str: + """String representation for AgentTarget, can be shown as a function call message.""" + return "Transfer to group chat" + + def needs_agent_wrapper(self) -> bool: + """Check if the target needs to be wrapped in an agent. 
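A `SpeakerSelectionResult` carries exactly one of three outcomes. The sketch below uses a duck-typed stand-in for `GroupChat` (an assumption for illustration only) to show how each outcome resolves:

```python
# Hedged sketch of the three resolutions of SpeakerSelectionResult defined above:
# an agent looked up by name, a built-in selection-method string, or termination.
from types import SimpleNamespace

from mm_agents.coact.autogen.agentchat.group.speaker_selection_result import SpeakerSelectionResult

alice = SimpleNamespace(name="alice")   # stands in for a ConversableAgent
chat = SimpleNamespace(agents=[alice])  # stands in for a GroupChat

assert SpeakerSelectionResult(agent_name="alice").get_speaker_selection_result(chat) is alice
assert SpeakerSelectionResult(speaker_selection_method="auto").get_speaker_selection_result(chat) == "auto"
assert SpeakerSelectionResult(terminate=True).get_speaker_selection_result(chat) is None
```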
GroupChatTarget must be wrapped in an agent.""" + return True + + def create_wrapper_agent(self, parent_agent: "ConversableAgent", index: int) -> "ConversableAgent": + """Create a wrapper agent for the group chat.""" + from autogen.agentchat import initiate_group_chat + + from ...conversable_agent import ConversableAgent # to avoid circular import + + # Create the wrapper agent with a name that identifies it as a wrapped group chat + group_chat_agent = ConversableAgent( + name=f"{__AGENT_WRAPPER_PREFIX__}group_{parent_agent.name}_{index + 1}", + # Copy LLM config from parent agent to ensure it can generate replies if needed + llm_config=parent_agent.llm_config, + ) + + # Store the config directly on the agent + group_chat_agent._group_chat_config = self.group_chat_config # type: ignore[attr-defined] + + # Define the reply function that will run the group chat + def group_chat_reply( + agent: "ConversableAgent", + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional["Agent"] = None, + config: Optional[Any] = None, + ) -> tuple[bool, Optional[dict[str, Any]]]: + """Run the inner group chat and return its results as a reply.""" + # Get the configuration stored directly on the agent + group_config = agent._group_chat_config # type: ignore[attr-defined] + + # Pull through the second last message from the outer chat (the last message will be the handoff message) + # This may need work to make sure we get the right message(s) from the outer chat + message = ( + messages[-2]["content"] + if messages and len(messages) >= 2 and "content" in messages[-2] + else "No message to pass through." + ) + + try: + # Run the group chat with direct agent references from the config + result, _, _ = initiate_group_chat( + pattern=group_config.pattern, + messages=message, + max_rounds=group_config.max_rounds, + ) + + # Return the summary from the chat result summary + return True, {"content": result.summary} + + except Exception as e: + # Handle any errors during execution + return True, {"content": f"Error running group chat: {str(e)}"} + + # Register the reply function with the wrapper agent + group_chat_agent.register_reply( + trigger=[ConversableAgent, None], + reply_func=group_chat_reply, + remove_other_reply_funcs=True, # Use only this reply function + ) + + # After the group chat completes, transition back to the parent agent + group_chat_agent.handoffs.set_after_work(AgentTarget(parent_agent)) + + return group_chat_agent diff --git a/mm_agents/coact/autogen/agentchat/group/targets/group_manager_target.py b/mm_agents/coact/autogen/agentchat/group/targets/group_manager_target.py new file mode 100644 index 0000000..3aab182 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/targets/group_manager_target.py @@ -0,0 +1,151 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import TYPE_CHECKING, Any, Optional, Type, Union + +from pydantic import BaseModel, field_validator + +from ....doc_utils import export_module +from ..context_str import ContextStr +from ..group_tool_executor import GroupToolExecutor +from ..speaker_selection_result import SpeakerSelectionResult +from .transition_target import TransitionTarget +from .transition_utils import __AGENT_WRAPPER_PREFIX__ + +if TYPE_CHECKING: + # Avoid circular import + from ...conversable_agent import ConversableAgent + from ...groupchat import GroupChat + +__all__ = ["GroupManagerTarget"] + + +def prepare_groupchat_auto_speaker( + 
groupchat: "GroupChat", + last_group_agent: "ConversableAgent", + group_chat_manager_selection_msg: Optional[Any], +) -> None: + """Prepare the group chat for auto speaker selection, includes updating or restore the groupchat speaker selection message. + + Tool Executor and wrapped agents will be removed from the available agents list. + + Args: + groupchat (GroupChat): GroupChat instance. + last_group_agent ("ConversableAgent"): The last group agent for which the LLM config is used + group_chat_manager_selection_msg (GroupManagerSelectionMessage): Optional message to use for the agent selection (in internal group chat). + """ + from ...groupchat import SELECT_SPEAKER_PROMPT_TEMPLATE + + def substitute_agentlist(template: str) -> str: + # Run through group chat's string substitution first for {agentlist} + # We need to do this so that the next substitution doesn't fail with agentlist + # and we can remove the tool executor and wrapped chats from the available agents list + agent_list = [ + agent + for agent in groupchat.agents + if not isinstance(agent, GroupToolExecutor) and not agent.name.startswith(__AGENT_WRAPPER_PREFIX__) + ] + + groupchat.select_speaker_prompt_template = template + return groupchat.select_speaker_prompt(agent_list) + + # Use the default speaker selection prompt if one is not specified, otherwise use the specified one + groupchat.select_speaker_prompt_template = substitute_agentlist( + SELECT_SPEAKER_PROMPT_TEMPLATE + if group_chat_manager_selection_msg is None + else group_chat_manager_selection_msg.get_message(last_group_agent) + ) + + +# GroupManagerSelectionMessage protocol and implementations +@export_module("autogen.agentchat.group") +class GroupManagerSelectionMessage(BaseModel): + """Base class for all GroupManager selection message types.""" + + def get_message(self, agent: "ConversableAgent") -> str: + """Get the formatted message.""" + raise NotImplementedError("Requires subclasses to implement.") + + +@export_module("autogen.agentchat.group") +class GroupManagerSelectionMessageString(GroupManagerSelectionMessage): + """Selection message that uses a plain string template.""" + + message: str + + def get_message(self, agent: "ConversableAgent") -> str: + """Get the message string.""" + return self.message + + +@export_module("autogen.agentchat.group") +class GroupManagerSelectionMessageContextStr(GroupManagerSelectionMessage): + """Selection message that uses a ContextStr template.""" + + context_str_template: str + + # We will replace {agentlist} with another term and return it later for use with the internal group chat auto speaker selection + # Otherwise our format will fail + @field_validator("context_str_template", mode="before") + def _replace_agentlist_placeholder(cls: Type["GroupManagerSelectionMessageContextStr"], v: Any) -> Union[str, Any]: # noqa: N805 + """Replace {agentlist} placeholder before validation/assignment.""" + if isinstance(v, str): + if "{agentlist}" in v: + return v.replace("{agentlist}", "<>") # Perform the replacement + else: + return v # If no replacement is needed, return the original value + return "" + + def get_message(self, agent: "ConversableAgent") -> str: + """Get the formatted message with context variables substituted.""" + context_str = ContextStr(template=self.context_str_template) + format_result = context_str.format(agent.context_variables) + if format_result is None: + return "" + + return format_result.replace( + "<>", "{agentlist}" + ) # Restore agentlist so it can be substituted by the internal group chat auto 
speaker selection + + +class GroupManagerTarget(TransitionTarget): + """Target that represents an agent by name.""" + + selection_message: Optional[GroupManagerSelectionMessage] = None + + def can_resolve_for_speaker_selection(self) -> bool: + """Check if the target can resolve for speaker selection.""" + return True + + def resolve( + self, + groupchat: "GroupChat", + current_agent: "ConversableAgent", + user_agent: Optional["ConversableAgent"], + ) -> SpeakerSelectionResult: + """Resolve to the speaker selection for the group.""" + if self.selection_message is not None: + prepare_groupchat_auto_speaker(groupchat, current_agent, self.selection_message) + + return SpeakerSelectionResult(speaker_selection_method="auto") + + def display_name(self) -> str: + """Get the display name for the target.""" + return "the group manager" + + def normalized_name(self) -> str: + """Get a normalized name for the target that has no spaces, used for function calling""" + return self.display_name() + + def __str__(self) -> str: + """String representation for AgentTarget, can be shown as a function call message.""" + return "Transfer to the group manager" + + def needs_agent_wrapper(self) -> bool: + """Check if the target needs to be wrapped in an agent.""" + return False + + def create_wrapper_agent(self, parent_agent: "ConversableAgent", index: int) -> "ConversableAgent": + """Create a wrapper agent for the target if needed.""" + raise NotImplementedError("GroupManagerTarget does not require wrapping in an agent.") diff --git a/mm_agents/coact/autogen/agentchat/group/targets/transition_target.py b/mm_agents/coact/autogen/agentchat/group/targets/transition_target.py new file mode 100644 index 0000000..eb7ac0f --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/targets/transition_target.py @@ -0,0 +1,413 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +import random +from typing import TYPE_CHECKING, Any, Optional + +from pydantic import BaseModel + +from ..speaker_selection_result import SpeakerSelectionResult +from .transition_utils import __AGENT_WRAPPER_PREFIX__ + +if TYPE_CHECKING: + # Avoid circular import + from ...conversable_agent import ConversableAgent + from ...groupchat import GroupChat + +__all__ = [ + "AgentNameTarget", + "AgentTarget", + "AskUserTarget", + "NestedChatTarget", + "RandomAgentTarget", + "RevertToUserTarget", + "StayTarget", + "TerminateTarget", + "TransitionTarget", +] + +# Common options for transitions +# terminate: Terminate the conversation +# revert_to_user: Revert to the user agent +# stay: Stay with the current agent +# group_manager: Use the group manager (auto speaker selection) +# ask_user: Use the user manager (ask the user, aka manual) +# TransitionOption = Literal["terminate", "revert_to_user", "stay", "group_manager", "ask_user"] + + +class TransitionTarget(BaseModel): + """Base class for all transition targets across OnCondition, OnContextCondition, and after work.""" + + def can_resolve_for_speaker_selection(self) -> bool: + """Check if the target can resolve to an option for speaker selection (Agent, 'None' to end, Str for speaker selection method). 
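`GroupManagerTarget` defers to the group manager's "auto" speaker selection, optionally with a custom selection message. A hedged configuration sketch follows; the import paths and the `set_after_work` call mirror usage elsewhere in this patch, and the prompt text is illustrative:

```python
# Hypothetical after-work configuration: when this agent finishes its turn,
# the group manager picks the next speaker using the custom prompt below.
from mm_agents.coact.autogen.agentchat.group.targets.group_manager_target import (
    GroupManagerSelectionMessageString,
    GroupManagerTarget,
)

after_work = GroupManagerTarget(
    selection_message=GroupManagerSelectionMessageString(
        message="Read the conversation so far, then pick the single role best placed to act next. Only return the role."
    )
)
# e.g. some_agent.handoffs.set_after_work(after_work)
```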
In the case of a nested chat, this will return False as it should be encapsulated in an agent.""" + return False + + def resolve( + self, + groupchat: "GroupChat", + current_agent: "ConversableAgent", + user_agent: Optional["ConversableAgent"], + ) -> SpeakerSelectionResult: + """Resolve to a speaker selection result (Agent, None for termination, or str for speaker selection method).""" + raise NotImplementedError("Requires subclasses to implement.") + + def display_name(self) -> str: + """Get the display name for the target.""" + raise NotImplementedError("Requires subclasses to implement.") + + def normalized_name(self) -> str: + """Get a normalized name for the target that has no spaces, used for function calling""" + raise NotImplementedError("Requires subclasses to implement.") + + def needs_agent_wrapper(self) -> bool: + """Check if the target needs to be wrapped in an agent.""" + raise NotImplementedError("Requires subclasses to implement.") + + def create_wrapper_agent(self, parent_agent: "ConversableAgent", index: int) -> "ConversableAgent": + """Create a wrapper agent for the target if needed.""" + raise NotImplementedError("Requires subclasses to implement.") + + +class AgentTarget(TransitionTarget): + """Target that represents a direct agent reference.""" + + agent_name: str + + def __init__(self, agent: "ConversableAgent", **data: Any) -> None: # type: ignore[no-untyped-def] + # Store the name from the agent for serialization + super().__init__(agent_name=agent.name, **data) + + def can_resolve_for_speaker_selection(self) -> bool: + """Check if the target can resolve for speaker selection.""" + return True + + def resolve( + self, + groupchat: "GroupChat", + current_agent: "ConversableAgent", + user_agent: Optional["ConversableAgent"], + ) -> SpeakerSelectionResult: + """Resolve to the actual agent object from the groupchat.""" + return SpeakerSelectionResult(agent_name=self.agent_name) + + def display_name(self) -> str: + """Get the display name for the target.""" + return f"{self.agent_name}" + + def normalized_name(self) -> str: + """Get a normalized name for the target that has no spaces, used for function calling""" + return self.display_name() + + def __str__(self) -> str: + """String representation for AgentTarget, can be shown as a function call message.""" + return f"Transfer to {self.agent_name}" + + def needs_agent_wrapper(self) -> bool: + """Check if the target needs to be wrapped in an agent.""" + return False + + def create_wrapper_agent(self, parent_agent: "ConversableAgent", index: int) -> "ConversableAgent": + """Create a wrapper agent for the target if needed.""" + raise NotImplementedError("AgentTarget does not require wrapping in an agent.") + + +class AgentNameTarget(TransitionTarget): + """Target that represents an agent by name.""" + + agent_name: str + + def __init__(self, agent_name: str, **data: Any) -> None: + """Initialize with agent name as a positional parameter.""" + super().__init__(agent_name=agent_name, **data) + + def can_resolve_for_speaker_selection(self) -> bool: + """Check if the target can resolve for speaker selection.""" + return True + + def resolve( + self, + groupchat: "GroupChat", + current_agent: "ConversableAgent", + user_agent: Optional["ConversableAgent"], + ) -> SpeakerSelectionResult: + """Resolve to the agent name string.""" + return SpeakerSelectionResult(agent_name=self.agent_name) + + def display_name(self) -> str: + """Get the display name for the target.""" + return f"{self.agent_name}" + + def normalized_name(self) -> 
str: + """Get a normalized name for the target that has no spaces, used for function calling""" + return self.display_name() + + def __str__(self) -> str: + """String representation for AgentTarget, can be shown as a function call message.""" + return f"Transfer to {self.agent_name}" + + def needs_agent_wrapper(self) -> bool: + """Check if the target needs to be wrapped in an agent.""" + return False + + def create_wrapper_agent(self, parent_agent: "ConversableAgent", index: int) -> "ConversableAgent": + """Create a wrapper agent for the target if needed.""" + raise NotImplementedError("AgentNameTarget does not require wrapping in an agent.") + + +class NestedChatTarget(TransitionTarget): + """Target that represents a nested chat configuration.""" + + nested_chat_config: dict[str, Any] + + def can_resolve_for_speaker_selection(self) -> bool: + """Check if the target can resolve for speaker selection. For NestedChatTarget the nested chat must be encapsulated into an agent.""" + return False + + def resolve( + self, + groupchat: "GroupChat", + current_agent: "ConversableAgent", + user_agent: Optional["ConversableAgent"], + ) -> SpeakerSelectionResult: + """Resolve to the nested chat configuration.""" + raise NotImplementedError( + "NestedChatTarget does not support the resolve method. An agent should be used to encapsulate this nested chat and then the target changed to an AgentTarget." + ) + + def display_name(self) -> str: + """Get the display name for the target.""" + return "a nested chat" + + def normalized_name(self) -> str: + """Get a normalized name for the target that has no spaces, used for function calling""" + return "nested_chat" + + def __str__(self) -> str: + """String representation for AgentTarget, can be shown as a function call message.""" + return "Transfer to nested chat" + + def needs_agent_wrapper(self) -> bool: + """Check if the target needs to be wrapped in an agent. 
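The concrete targets in this file all follow the same small contract. A hypothetical extra target, sketched under the assumption that the vendored import paths are available, shows the minimum a directly-resolvable target must implement:

```python
# Toy target: always hand the floor to the first agent registered in the group
# chat. Because it resolves directly, it never needs an agent wrapper.
from mm_agents.coact.autogen.agentchat.group.speaker_selection_result import SpeakerSelectionResult
from mm_agents.coact.autogen.agentchat.group.targets.transition_target import TransitionTarget


class FirstAgentTarget(TransitionTarget):
    def can_resolve_for_speaker_selection(self) -> bool:
        return True

    def resolve(self, groupchat, current_agent, user_agent) -> SpeakerSelectionResult:
        return SpeakerSelectionResult(agent_name=groupchat.agents[0].name)

    def display_name(self) -> str:
        return "First agent"

    def normalized_name(self) -> str:
        return "first_agent"

    def __str__(self) -> str:
        return "Transfer to the first agent"

    def needs_agent_wrapper(self) -> bool:
        return False
```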
NestedChatTarget must be wrapped in an agent.""" + return True + + def create_wrapper_agent(self, parent_agent: "ConversableAgent", index: int) -> "ConversableAgent": + """Create a wrapper agent for the nested chat.""" + from ...conversable_agent import ConversableAgent # to avoid circular import - NEED SOLUTION + + nested_chat_agent = ConversableAgent(name=f"{__AGENT_WRAPPER_PREFIX__}nested_{parent_agent.name}_{index + 1}") + + nested_chat_agent.register_nested_chats( + self.nested_chat_config["chat_queue"], + reply_func_from_nested_chats=self.nested_chat_config.get("reply_func_from_nested_chats") + or "summary_from_nested_chats", + config=self.nested_chat_config.get("config"), + trigger=lambda sender: True, + position=0, + use_async=self.nested_chat_config.get("use_async", False), + ) + + # After the nested chat is complete, transfer back to the parent agent + nested_chat_agent.handoffs.set_after_work(AgentTarget(parent_agent)) + + return nested_chat_agent + + +class TerminateTarget(TransitionTarget): + """Target that represents a termination of the conversation.""" + + def can_resolve_for_speaker_selection(self) -> bool: + """Check if the target can resolve for speaker selection.""" + return True + + def resolve( + self, + groupchat: "GroupChat", + current_agent: "ConversableAgent", + user_agent: Optional["ConversableAgent"], + ) -> SpeakerSelectionResult: + """Resolve to termination.""" + return SpeakerSelectionResult(terminate=True) + + def display_name(self) -> str: + """Get the display name for the target.""" + return "Terminate" + + def normalized_name(self) -> str: + """Get a normalized name for the target that has no spaces, used for function calling""" + return "terminate" + + def __str__(self) -> str: + """String representation for AgentTarget, can be shown as a function call message.""" + return "Terminate" + + def needs_agent_wrapper(self) -> bool: + """Check if the target needs to be wrapped in an agent.""" + return False + + def create_wrapper_agent(self, parent_agent: "ConversableAgent", index: int) -> "ConversableAgent": + """Create a wrapper agent for the target if needed.""" + raise NotImplementedError("TerminateTarget does not require wrapping in an agent.") + + +class StayTarget(TransitionTarget): + """Target that represents staying with the current agent.""" + + def can_resolve_for_speaker_selection(self) -> bool: + """Check if the target can resolve for speaker selection.""" + return True + + def resolve( + self, + groupchat: "GroupChat", + current_agent: "ConversableAgent", + user_agent: Optional["ConversableAgent"], + ) -> SpeakerSelectionResult: + """Resolve to staying with the current agent.""" + return SpeakerSelectionResult(agent_name=current_agent.name) + + def display_name(self) -> str: + """Get the display name for the target.""" + return "Stay" + + def normalized_name(self) -> str: + """Get a normalized name for the target that has no spaces, used for function calling""" + return "stay" + + def __str__(self) -> str: + """String representation for AgentTarget, can be shown as a function call message.""" + return "Stay with agent" + + def needs_agent_wrapper(self) -> bool: + """Check if the target needs to be wrapped in an agent.""" + return False + + def create_wrapper_agent(self, parent_agent: "ConversableAgent", index: int) -> "ConversableAgent": + """Create a wrapper agent for the target if needed.""" + raise NotImplementedError("StayTarget does not require wrapping in an agent.") + + +class RevertToUserTarget(TransitionTarget): + """Target that 
represents reverting to the user agent.""" + + def can_resolve_for_speaker_selection(self) -> bool: + """Check if the target can resolve for speaker selection.""" + return True + + def resolve( + self, + groupchat: "GroupChat", + current_agent: "ConversableAgent", + user_agent: Optional["ConversableAgent"], + ) -> SpeakerSelectionResult: + """Resolve to reverting to the user agent.""" + if user_agent is None: + raise ValueError("User agent must be provided to the chat for the revert_to_user option.") + return SpeakerSelectionResult(agent_name=user_agent.name) + + def display_name(self) -> str: + """Get the display name for the target.""" + return "Revert to User" + + def normalized_name(self) -> str: + """Get a normalized name for the target that has no spaces, used for function calling""" + return "revert_to_user" + + def __str__(self) -> str: + """String representation for AgentTarget, can be shown as a function call message.""" + return "Revert to User" + + def needs_agent_wrapper(self) -> bool: + """Check if the target needs to be wrapped in an agent.""" + return False + + def create_wrapper_agent(self, parent_agent: "ConversableAgent", index: int) -> "ConversableAgent": + """Create a wrapper agent for the target if needed.""" + raise NotImplementedError("RevertToUserTarget does not require wrapping in an agent.") + + +class AskUserTarget(TransitionTarget): + """Target that represents asking the user for input.""" + + def can_resolve_for_speaker_selection(self) -> bool: + """Check if the target can resolve for speaker selection.""" + return True + + def resolve( + self, + groupchat: "GroupChat", + current_agent: "ConversableAgent", + user_agent: Optional["ConversableAgent"], + ) -> SpeakerSelectionResult: + """Resolve to asking the user for input.""" + return SpeakerSelectionResult(speaker_selection_method="manual") + + def display_name(self) -> str: + """Get the display name for the target.""" + return "Ask User" + + def normalized_name(self) -> str: + """Get a normalized name for the target that has no spaces, used for function calling""" + return "ask_user" + + def __str__(self) -> str: + """String representation for AgentTarget, can be shown as a function call message.""" + return "Ask User" + + def needs_agent_wrapper(self) -> bool: + """Check if the target needs to be wrapped in an agent.""" + return False + + def create_wrapper_agent(self, parent_agent: "ConversableAgent", index: int) -> "ConversableAgent": + """Create a wrapper agent for the target if needed.""" + raise NotImplementedError("AskUserTarget does not require wrapping in an agent.") + + +class RandomAgentTarget(TransitionTarget): + """Target that represents a random selection from a list of agents.""" + + agent_names: list[str] + nominated_name: str = "" + + def __init__(self, agents: list["ConversableAgent"], **data: Any) -> None: # type: ignore[no-untyped-def] + # Store the name from the agent for serialization + super().__init__(agent_names=[agent.name for agent in agents], **data) + + def can_resolve_for_speaker_selection(self) -> bool: + """Check if the target can resolve for speaker selection.""" + return True + + def resolve( + self, + groupchat: "GroupChat", + current_agent: "ConversableAgent", + user_agent: Optional["ConversableAgent"], + ) -> SpeakerSelectionResult: + """Resolve to the actual agent object from the groupchat, choosing a random agent (except the current one)""" + # Randomly select the next agent + self.nominated_name = random.choice([name for name in self.agent_names if name != 
current_agent.name]) + + return SpeakerSelectionResult(agent_name=self.nominated_name) + + def display_name(self) -> str: + """Get the display name for the target.""" + return self.nominated_name + + def normalized_name(self) -> str: + """Get a normalized name for the target that has no spaces, used for function calling""" + return self.display_name() + + def __str__(self) -> str: + """String representation for RandomAgentTarget, can be shown as a function call message.""" + return f"Transfer to {self.nominated_name}" + + def needs_agent_wrapper(self) -> bool: + """Check if the target needs to be wrapped in an agent.""" + return False + + def create_wrapper_agent(self, parent_agent: "ConversableAgent", index: int) -> "ConversableAgent": + """Create a wrapper agent for the target if needed.""" + raise NotImplementedError("RandomAgentTarget does not require wrapping in an agent.") + + +# TODO: Consider adding a SequentialChatTarget class diff --git a/mm_agents/coact/autogen/agentchat/group/targets/transition_utils.py b/mm_agents/coact/autogen/agentchat/group/targets/transition_utils.py new file mode 100644 index 0000000..fd904d4 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/group/targets/transition_utils.py @@ -0,0 +1,6 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +# Prefix for all wrapped agent names +__AGENT_WRAPPER_PREFIX__ = "wrapped_" diff --git a/mm_agents/coact/autogen/agentchat/groupchat.py b/mm_agents/coact/autogen/agentchat/groupchat.py new file mode 100644 index 0000000..960bbc2 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/groupchat.py @@ -0,0 +1,1694 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +import copy +import json +import logging +import random +import re +import sys +from dataclasses import dataclass, field +from typing import Any, Callable, Literal, Optional, Union + +from ..code_utils import content_str +from ..doc_utils import export_module +from ..events.agent_events import ( + ClearAgentsHistoryEvent, + GroupChatResumeEvent, + GroupChatRunChatEvent, + SelectSpeakerEvent, + SelectSpeakerInvalidInputEvent, + SelectSpeakerTryCountExceededEvent, + SpeakerAttemptFailedMultipleAgentsEvent, + SpeakerAttemptFailedNoAgentsEvent, + SpeakerAttemptSuccessfulEvent, + TerminationEvent, +) +from ..exception_utils import AgentNameConflictError, NoEligibleSpeakerError, UndefinedNextAgentError +from ..graph_utils import check_graph_validity, invert_disallowed_to_allowed +from ..io.base import IOStream +from ..llm_config import LLMConfig +from ..oai.client import ModelClient +from ..runtime_logging import log_new_agent, logging_enabled +from .agent import Agent +from .contrib.capabilities import transform_messages +from .conversable_agent import ConversableAgent + +logger = logging.getLogger(__name__) + +SELECT_SPEAKER_PROMPT_TEMPLATE = ( + "Read the above conversation. Then select the next role from {agentlist} to play. Only return the role." +) + + +@dataclass +@export_module("autogen") +class GroupChat: + """(In preview) A group chat class that contains the following data fields: + - agents: a list of participating agents. + - messages: a list of messages in the group chat. + - max_round: the maximum number of rounds. 
+ - admin_name: the name of the admin agent if there is one. Default is "Admin". + KeyBoardInterrupt will make the admin agent take over. + - func_call_filter: whether to enforce function call filter. Default is True. + When set to True and when a message is a function call suggestion, + the next speaker will be chosen from an agent which contains the corresponding function name + in its `function_map`. + - select_speaker_message_template: customize the select speaker message (used in "auto" speaker selection), which appears first in the message context and generally includes the agent descriptions and list of agents. If the string contains "`{roles}`" it will replaced with the agent's and their role descriptions. If the string contains "`{agentlist}`" it will be replaced with a comma-separated list of agent names in square brackets. The default value is: + "You are in a role play game. The following roles are available: + `{roles}`. + Read the following conversation. + Then select the next role from `{agentlist}` to play. Only return the role." + - select_speaker_prompt_template: customize the select speaker prompt (used in "auto" speaker selection), which appears last in the message context and generally includes the list of agents and guidance for the LLM to select the next agent. If the string contains "`{agentlist}`" it will be replaced with a comma-separated list of agent names in square brackets. The default value is: + "Read the above conversation. Then select the next role from `{agentlist}` to play. Only return the role." + To ignore this prompt being used, set this to None. If set to None, ensure your instructions for selecting a speaker are in the select_speaker_message_template string. + - select_speaker_auto_multiple_template: customize the follow-up prompt used when selecting a speaker fails with a response that contains multiple agent names. This prompt guides the LLM to return just one agent name. Applies only to "auto" speaker selection method. If the string contains "`{agentlist}`" it will be replaced with a comma-separated list of agent names in square brackets. The default value is: + "You provided more than one name in your text, please return just the name of the next speaker. To determine the speaker use these prioritised rules: + 1. If the context refers to themselves as a speaker e.g. "As the..." , choose that speaker's name + 2. If it refers to the "next" speaker name, choose that name + 3. Otherwise, choose the first provided speaker's name in the context + The names are case-sensitive and should not be abbreviated or changed. + Respond with ONLY the name of the speaker and DO NOT provide a reason." + - select_speaker_auto_none_template: customize the follow-up prompt used when selecting a speaker fails with a response that contains no agent names. This prompt guides the LLM to return an agent name and provides a list of agent names. Applies only to "auto" speaker selection method. If the string contains "`{agentlist}`" it will be replaced with a comma-separated list of agent names in square brackets. The default value is: + "You didn't choose a speaker. As a reminder, to determine the speaker use these prioritised rules: + 1. If the context refers to themselves as a speaker e.g. "As the..." , choose that speaker's name + 2. If it refers to the "next" speaker name, choose that name + 3. Otherwise, choose the first provided speaker's name in the context + The names are case-sensitive and should not be abbreviated or changed. 
+ The only names that are accepted are `{agentlist}`. + Respond with ONLY the name of the speaker and DO NOT provide a reason." + - speaker_selection_method: the method for selecting the next speaker. Default is "auto". + Could be any of the following (case insensitive), will raise ValueError if not recognized: + - "auto": the next speaker is selected automatically by LLM. + - "manual": the next speaker is selected manually by user input. + - "random": the next speaker is selected randomly. + - "round_robin": the next speaker is selected in a round robin fashion, i.e., iterating in the same order as provided in `agents`. + - a customized speaker selection function (Callable): the function will be called to select the next speaker. + The function should take the last speaker and the group chat as input and return one of the following: + 1. an `Agent` class, it must be one of the agents in the group chat. + 2. a string from ['auto', 'manual', 'random', 'round_robin'] to select a default method to use. + 3. None, which would terminate the conversation gracefully. + ```python + def custom_speaker_selection_func( + last_speaker: Agent, groupchat: GroupChat + ) -> Union[Agent, str, None]: + ``` + - max_retries_for_selecting_speaker: the maximum number of times the speaker selection requery process will run. + If, during speaker selection, multiple agent names or no agent names are returned by the LLM as the next agent, it will be queried again up to the maximum number + of times until a single agent is returned or it exhausts the maximum attempts. + Applies only to "auto" speaker selection method. + Default is 2. + - select_speaker_transform_messages: (optional) the message transformations to apply to the nested select speaker agent-to-agent chat messages. + Takes a TransformMessages object, defaults to None and is only utilised when the speaker selection method is "auto". + - select_speaker_auto_verbose: whether to output the select speaker responses and selections + If set to True, the outputs from the two agents in the nested select speaker chat will be output, along with + whether the responses were successful, or not, in selecting an agent + Applies only to "auto" speaker selection method. + - allow_repeat_speaker: whether to allow the same speaker to speak consecutively. + Default is True, in which case all speakers are allowed to speak consecutively. + If `allow_repeat_speaker` is a list of Agents, then only those listed agents are allowed to repeat. + If set to False, then no speakers are allowed to repeat. + `allow_repeat_speaker` and `allowed_or_disallowed_speaker_transitions` are mutually exclusive. + - allowed_or_disallowed_speaker_transitions: dict. + The keys are source agents, and the values are agents that the key agent can/can't transit to, + depending on speaker_transitions_type. Default is None, which means all agents can transit to all other agents. + `allow_repeat_speaker` and `allowed_or_disallowed_speaker_transitions` are mutually exclusive. + - speaker_transitions_type: whether the speaker_transitions_type is a dictionary containing lists of allowed agents or disallowed agents. + "allowed" means the `allowed_or_disallowed_speaker_transitions` is a dictionary containing lists of allowed agents. + If set to "disallowed", then the `allowed_or_disallowed_speaker_transitions` is a dictionary containing lists of disallowed agents. + Must be supplied if `allowed_or_disallowed_speaker_transitions` is not None. 
+ - enable_clear_history: enable possibility to clear history of messages for agents manually by providing + "clear history" phrase in user prompt. This is experimental feature. + See description of GroupChatManager.clear_agents_history function for more info. + - send_introductions: send a round of introductions at the start of the group chat, so agents know who they can speak to (default: False) + - select_speaker_auto_model_client_cls: Custom model client class for the internal speaker select agent used during 'auto' speaker selection (optional) + - select_speaker_auto_llm_config: LLM config for the internal speaker select agent used during 'auto' speaker selection (optional) + - role_for_select_speaker_messages: sets the role name for speaker selection when in 'auto' mode, typically 'user' or 'system'. (default: 'system') + """ + + agents: list[Agent] + messages: list[dict[str, Any]] = field(default_factory=list) + max_round: int = 10 + admin_name: str = "Admin" + func_call_filter: bool = True + speaker_selection_method: Union[Literal["auto", "manual", "random", "round_robin"], Callable[..., Any]] = "auto" + max_retries_for_selecting_speaker: int = 2 + allow_repeat_speaker: Optional[Union[bool, list[Agent]]] = None + allowed_or_disallowed_speaker_transitions: Optional[dict[str, Any]] = None + speaker_transitions_type: Literal["allowed", "disallowed", None] = None + enable_clear_history: bool = False + send_introductions: bool = False + select_speaker_message_template: str = """You are in a role play game. The following roles are available: + {roles}. + Read the following conversation. + Then select the next role from {agentlist} to play. Only return the role.""" + select_speaker_prompt_template: str = SELECT_SPEAKER_PROMPT_TEMPLATE + select_speaker_auto_multiple_template: str = """You provided more than one name in your text, please return just the name of the next speaker. To determine the speaker use these prioritised rules: + 1. If the context refers to themselves as a speaker e.g. "As the..." , choose that speaker's name + 2. If it refers to the "next" speaker name, choose that name + 3. Otherwise, choose the first provided speaker's name in the context + The names are case-sensitive and should not be abbreviated or changed. + Respond with ONLY the name of the speaker and DO NOT provide a reason.""" + select_speaker_auto_none_template: str = """You didn't choose a speaker. As a reminder, to determine the speaker use these prioritised rules: + 1. If the context refers to themselves as a speaker e.g. "As the..." , choose that speaker's name + 2. If it refers to the "next" speaker name, choose that name + 3. Otherwise, choose the first provided speaker's name in the context + The names are case-sensitive and should not be abbreviated or changed. + The only names that are accepted are {agentlist}. 
+ Respond with ONLY the name of the speaker and DO NOT provide a reason.""" + select_speaker_transform_messages: Optional[transform_messages.TransformMessages] = None + select_speaker_auto_verbose: Optional[bool] = False + select_speaker_auto_model_client_cls: Optional[Union[ModelClient, list[ModelClient]]] = None + select_speaker_auto_llm_config: Optional[Union[LLMConfig, dict[str, Any], Literal[False]]] = None + role_for_select_speaker_messages: Optional[str] = "system" + + _VALID_SPEAKER_SELECTION_METHODS = ["auto", "manual", "random", "round_robin"] + _VALID_SPEAKER_TRANSITIONS_TYPE = ["allowed", "disallowed", None] + + # Define a class attribute for the default introduction message + DEFAULT_INTRO_MSG = ( + "Hello everyone. We have assembled a great team today to answer questions and solve tasks. In attendance are:" + ) + + allowed_speaker_transitions_dict: dict[str, list[Agent]] = field(init=False) + + def __post_init__(self): + # Post init steers clears of the automatically generated __init__ method from dataclass + + if self.allow_repeat_speaker is not None and not isinstance(self.allow_repeat_speaker, (bool, list)): + raise ValueError("GroupChat allow_repeat_speaker should be a bool or a list of Agents.") + + # Here, we create allowed_speaker_transitions_dict from the supplied allowed_or_disallowed_speaker_transitions and speaker_transitions_type, and lastly checks for validity. + + # Check input + if self.speaker_transitions_type is not None: + self.speaker_transitions_type = self.speaker_transitions_type.lower() + + if self.speaker_transitions_type not in self._VALID_SPEAKER_TRANSITIONS_TYPE: + raise ValueError( + f"GroupChat speaker_transitions_type is set to '{self.speaker_transitions_type}'. " + f"It should be one of {self._VALID_SPEAKER_TRANSITIONS_TYPE} (case insensitive). " + ) + + # If both self.allowed_or_disallowed_speaker_transitions is None and self.allow_repeat_speaker is None, set allow_repeat_speaker to True to ensure backward compatibility + # Discussed in https://github.com/microsoft/autogen/pull/857#discussion_r1451541204 + if self.allowed_or_disallowed_speaker_transitions is None and self.allow_repeat_speaker is None: + self.allow_repeat_speaker = True + + # self.allowed_or_disallowed_speaker_transitions and self.allow_repeat_speaker are mutually exclusive parameters. + # Discussed in https://github.com/microsoft/autogen/pull/857#discussion_r1451266661 + if self.allowed_or_disallowed_speaker_transitions is not None and self.allow_repeat_speaker is not None: + raise ValueError( + "Don't provide both allowed_or_disallowed_speaker_transitions and allow_repeat_speaker in group chat. " + "Please set one of them to None." + ) + + # Asks the user to specify whether the speaker_transitions_type is allowed or disallowed if speaker_transitions_type is supplied + # Discussed in https://github.com/microsoft/autogen/pull/857#discussion_r1451259524 + if self.allowed_or_disallowed_speaker_transitions is not None and self.speaker_transitions_type is None: + raise ValueError( + "GroupChat allowed_or_disallowed_speaker_transitions is not None, but speaker_transitions_type is None. " + "Please set speaker_transitions_type to either 'allowed' or 'disallowed'." 
+                )
+
+        # Inferring self.allowed_speaker_transitions_dict
+        # Create self.allowed_speaker_transitions_dict if allowed_or_disallowed_speaker_transitions is None, using allow_repeat_speaker
+        if self.allowed_or_disallowed_speaker_transitions is None:
+            self.allowed_speaker_transitions_dict = {}
+
+            # Create a fully connected allowed_speaker_transitions_dict not including self loops
+            for agent in self.agents:
+                self.allowed_speaker_transitions_dict[agent] = [
+                    other_agent for other_agent in self.agents if other_agent != agent
+                ]
+
+            # If self.allow_repeat_speaker is True, add self loops to all agents
+            if self.allow_repeat_speaker is True:
+                for agent in self.agents:
+                    self.allowed_speaker_transitions_dict[agent].append(agent)
+
+            # Else if self.allow_repeat_speaker is a list of Agents, add self loops to the agents in the list
+            elif isinstance(self.allow_repeat_speaker, list):
+                for agent in self.allow_repeat_speaker:
+                    self.allowed_speaker_transitions_dict[agent].append(agent)
+
+        # Create self.allowed_speaker_transitions_dict if allowed_or_disallowed_speaker_transitions is not None, using allowed_or_disallowed_speaker_transitions
+        else:
+            # Process based on speaker_transitions_type
+            if self.speaker_transitions_type == "allowed":
+                self.allowed_speaker_transitions_dict = self.allowed_or_disallowed_speaker_transitions
+            else:
+                # Logic for processing disallowed allowed_or_disallowed_speaker_transitions to allowed_speaker_transitions_dict
+                self.allowed_speaker_transitions_dict = invert_disallowed_to_allowed(
+                    self.allowed_or_disallowed_speaker_transitions, self.agents
+                )
+
+        # Check for validity
+        check_graph_validity(
+            allowed_speaker_transitions_dict=self.allowed_speaker_transitions_dict,
+            agents=self.agents,
+        )
+
+        # Check select speaker messages, prompts, roles, and retries have values
+        if self.select_speaker_message_template is None or len(self.select_speaker_message_template) == 0:
+            raise ValueError("select_speaker_message_template cannot be empty or None.")
+
+        if self.select_speaker_prompt_template is not None and len(self.select_speaker_prompt_template) == 0:
+            self.select_speaker_prompt_template = None
+
+        if self.role_for_select_speaker_messages is None or len(self.role_for_select_speaker_messages) == 0:
+            raise ValueError("role_for_select_speaker_messages cannot be empty or None.")
+
+        if self.select_speaker_auto_multiple_template is None or len(self.select_speaker_auto_multiple_template) == 0:
+            raise ValueError("select_speaker_auto_multiple_template cannot be empty or None.")
+
+        if self.select_speaker_auto_none_template is None or len(self.select_speaker_auto_none_template) == 0:
+            raise ValueError("select_speaker_auto_none_template cannot be empty or None.")
+
+        # Validate max select speakers retries
+        if self.max_retries_for_selecting_speaker is None or not isinstance(
+            self.max_retries_for_selecting_speaker, int
+        ):
+            raise ValueError("max_retries_for_selecting_speaker cannot be None or non-int")
+        elif self.max_retries_for_selecting_speaker < 0:
+            raise ValueError("max_retries_for_selecting_speaker must be greater than or equal to zero")
+
+        # Load message transforms here (load once for the Group Chat so we don't have to re-initiate it and it maintains the cache across subsequent select speaker calls)
+        if self.select_speaker_transform_messages is not None:
+            if 
isinstance(self.select_speaker_transform_messages, transform_messages.TransformMessages): + self._speaker_selection_transforms = self.select_speaker_transform_messages + else: + raise ValueError("select_speaker_transform_messages must be None or MessageTransforms.") + else: + self._speaker_selection_transforms = None + + # Validate select_speaker_auto_verbose + if self.select_speaker_auto_verbose is None or not isinstance(self.select_speaker_auto_verbose, bool): + raise ValueError("select_speaker_auto_verbose cannot be None or non-bool") + + @property + def agent_names(self) -> list[str]: + """Return the names of the agents in the group chat.""" + return [agent.name for agent in self.agents] + + def reset(self): + """Reset the group chat.""" + self.messages.clear() + + def append(self, message: dict[str, Any], speaker: Agent): + """Append a message to the group chat. + We cast the content to str here so that it can be managed by text-based + model. + """ + # set the name to speaker's name if the role is not function + # if the role is tool, it is OK to modify the name + if message["role"] != "function": + message["name"] = speaker.name + if not isinstance(message["content"], str) and not isinstance(message["content"], list): + message["content"] = str(message["content"]) + message["content"] = content_str(message["content"]) + self.messages.append(message) + + def agent_by_name( + self, name: str, recursive: bool = False, raise_on_name_conflict: bool = False + ) -> Optional[Agent]: + """Returns the agent with a given name. If recursive is True, it will search in nested teams.""" + agents = self.nested_agents() if recursive else self.agents + filtered_agents = [agent for agent in agents if agent.name == name] + + if raise_on_name_conflict and len(filtered_agents) > 1: + raise AgentNameConflictError() + + return filtered_agents[0] if filtered_agents else None + + def nested_agents(self) -> list[Agent]: + """Returns all agents in the group chat manager.""" + agents = self.agents.copy() + for agent in agents: + if isinstance(agent, GroupChatManager): + # Recursive call for nested teams + agents.extend(agent.groupchat.nested_agents()) + return agents + + def next_agent(self, agent: Agent, agents: Optional[list[Agent]] = None) -> Agent: + """Return the next agent in the list.""" + if agents is None: + agents = self.agents + + # Ensure the provided list of agents is a subset of self.agents + if not set(agents).issubset(set(self.agents)): + raise UndefinedNextAgentError() + + # What index is the agent? (-1 if not present) + idx = self.agent_names.index(agent.name) if agent.name in self.agent_names else -1 + + # Return the next agent + if agents == self.agents: + return agents[(idx + 1) % len(agents)] + else: + offset = idx + 1 + for i in range(len(self.agents)): + if self.agents[(offset + i) % len(self.agents)] in agents: + return self.agents[(offset + i) % len(self.agents)] + + # Explicitly handle cases where no valid next agent exists in the provided subset. + raise UndefinedNextAgentError() + + def select_speaker_msg(self, agents: Optional[list[Agent]] = None) -> str: + """Return the system message for selecting the next speaker. 
This is always the *first* message in the context.""" + if agents is None: + agents = self.agents + + roles = self._participant_roles(agents) + agentlist = f"{[agent.name for agent in agents]}" + + return_msg = self.select_speaker_message_template.format(roles=roles, agentlist=agentlist) + return return_msg + + def select_speaker_prompt(self, agents: Optional[list[Agent]] = None) -> str: + """Return the floating system prompt selecting the next speaker. + This is always the *last* message in the context. + Will return None if the select_speaker_prompt_template is None. + """ + if self.select_speaker_prompt_template is None: + return None + + if agents is None: + agents = self.agents + + agentlist = f"{[agent.name for agent in agents]}" + + return_prompt = f"{self.select_speaker_prompt_template}".replace("{agentlist}", agentlist) + return return_prompt + + def introductions_msg(self, agents: Optional[list[Agent]] = None) -> str: + """Return the system message for selecting the next speaker. This is always the *first* message in the context.""" + if agents is None: + agents = self.agents + + # Use the class attribute instead of a hardcoded string + intro_msg = self.DEFAULT_INTRO_MSG + participant_roles = self._participant_roles(agents) + + return f"{intro_msg}\n\n{participant_roles}" + + def manual_select_speaker(self, agents: Optional[list[Agent]] = None) -> Union[Agent, None]: + """Manually select the next speaker.""" + iostream = IOStream.get_default() + + if agents is None: + agents = self.agents + + iostream.send(SelectSpeakerEvent(agents=agents)) + + try_count = 0 + # Assume the user will enter a valid number within 3 tries, otherwise use auto selection to avoid blocking. + while try_count <= 3: + try_count += 1 + if try_count >= 3: + iostream.send(SelectSpeakerTryCountExceededEvent(try_count=try_count, agents=agents)) + break + try: + i = iostream.input( + "Enter the number of the next speaker (enter nothing or `q` to use auto selection): " + ) + if i == "" or i == "q": + break + i = int(i) + if i > 0 and i <= len(agents): + return agents[i - 1] + else: + raise ValueError + except ValueError: + iostream.send(SelectSpeakerInvalidInputEvent(agents=agents)) + return None + + def random_select_speaker(self, agents: Optional[list[Agent]] = None) -> Union[Agent, None]: + """Randomly select the next speaker.""" + if agents is None: + agents = self.agents + return random.choice(agents) + + def _prepare_and_select_agents( + self, + last_speaker: Agent, + ) -> tuple[Optional[Agent], list[Agent], Optional[list[dict[str, Any]]]]: + # If self.speaker_selection_method is a callable, call it to get the next speaker. + # If self.speaker_selection_method is a string, return it. + speaker_selection_method = self.speaker_selection_method + if isinstance(self.speaker_selection_method, Callable): + selected_agent = self.speaker_selection_method(last_speaker, self) + if selected_agent is None: + raise NoEligibleSpeakerError( + "Custom speaker selection function returned None. Terminating conversation." + ) + elif isinstance(selected_agent, Agent): + if selected_agent in self.agents: + return selected_agent, self.agents, None + else: + raise ValueError( + f"Custom speaker selection function returned an agent {selected_agent.name} not in the group chat." 
+ ) + elif isinstance(selected_agent, str): + # If returned a string, assume it is a speaker selection method + speaker_selection_method = selected_agent + else: + raise ValueError( + f"Custom speaker selection function returned an object of type {type(selected_agent)} instead of Agent or str." + ) + + if speaker_selection_method.lower() not in self._VALID_SPEAKER_SELECTION_METHODS: + raise ValueError( + f"GroupChat speaker_selection_method is set to '{speaker_selection_method}'. " + f"It should be one of {self._VALID_SPEAKER_SELECTION_METHODS} (case insensitive). " + ) + + # If provided a list, make sure the agent is in the list + allow_repeat_speaker = ( + self.allow_repeat_speaker + if isinstance(self.allow_repeat_speaker, bool) or self.allow_repeat_speaker is None + else last_speaker in self.allow_repeat_speaker + ) + + agents = self.agents + n_agents = len(agents) + # Warn if GroupChat is underpopulated + if n_agents < 2: + raise ValueError( + f"GroupChat is underpopulated with {n_agents} agents. " + "Please add more agents to the GroupChat or use direct communication instead." + ) + elif n_agents == 2 and speaker_selection_method.lower() != "round_robin" and allow_repeat_speaker: + logger.warning( + f"GroupChat is underpopulated with {n_agents} agents. " + "Consider setting speaker_selection_method to 'round_robin' or allow_repeat_speaker to False, " + "or use direct communication, unless repeated speaker is desired." + ) + + if ( + self.func_call_filter + and self.messages + and ("function_call" in self.messages[-1] or "tool_calls" in self.messages[-1]) + ): + funcs = [] + if "function_call" in self.messages[-1]: + funcs += [self.messages[-1]["function_call"]["name"]] + if "tool_calls" in self.messages[-1]: + funcs += [ + tool["function"]["name"] for tool in self.messages[-1]["tool_calls"] if tool["type"] == "function" + ] + + # find agents with the right function_map which contains the function name + agents = [agent for agent in self.agents if agent.can_execute_function(funcs)] + if len(agents) == 1: + # only one agent can execute the function + return agents[0], agents, None + elif not agents: + # find all the agents with function_map + agents = [agent for agent in self.agents if agent.function_map] + if len(agents) == 1: + return agents[0], agents, None + elif not agents: + raise ValueError( + f"No agent can execute the function {', '.join(funcs)}. " + "Please check the function_map of the agents." + ) + # remove the last speaker from the list to avoid selecting the same speaker if allow_repeat_speaker is False + agents = [agent for agent in agents if agent != last_speaker] if allow_repeat_speaker is False else agents + + # Filter agents with allowed_speaker_transitions_dict + + is_last_speaker_in_group = last_speaker in self.agents + + # this condition means last_speaker is a sink in the graph, then no agents are eligible + if last_speaker not in self.allowed_speaker_transitions_dict and is_last_speaker_in_group: + raise NoEligibleSpeakerError( + f"Last speaker {last_speaker.name} is not in the allowed_speaker_transitions_dict." 
+ ) + # last_speaker is not in the group, so all agents are eligible + elif last_speaker not in self.allowed_speaker_transitions_dict and not is_last_speaker_in_group: + graph_eligible_agents = [] + else: + # Extract agent names from the list of agents + graph_eligible_agents = [ + agent for agent in agents if agent in self.allowed_speaker_transitions_dict[last_speaker] + ] + + # If there is only one eligible agent, just return it to avoid the speaker selection prompt + if len(graph_eligible_agents) == 1: + return graph_eligible_agents[0], graph_eligible_agents, None + + # If there are no eligible agents, return None, which means all agents will be taken into consideration in the next step + if len(graph_eligible_agents) == 0: + graph_eligible_agents = None + + # Use the selected speaker selection method + select_speaker_messages = None + if speaker_selection_method.lower() == "manual": + selected_agent = self.manual_select_speaker(graph_eligible_agents) + elif speaker_selection_method.lower() == "round_robin": + selected_agent = self.next_agent(last_speaker, graph_eligible_agents) + elif speaker_selection_method.lower() == "random": + selected_agent = self.random_select_speaker(graph_eligible_agents) + else: # auto + selected_agent = None + select_speaker_messages = self.messages.copy() + # If last message is a tool call or function call, blank the call so the api doesn't throw + if select_speaker_messages[-1].get("function_call", False): + select_speaker_messages[-1] = dict(select_speaker_messages[-1], function_call=None) + if select_speaker_messages[-1].get("tool_calls", False): + select_speaker_messages[-1] = dict(select_speaker_messages[-1], tool_calls=None) + return selected_agent, graph_eligible_agents, select_speaker_messages + + def select_speaker(self, last_speaker: Agent, selector: ConversableAgent) -> Agent: + """Select the next speaker (with requery).""" + # Prepare the list of available agents and select an agent if selection method allows (non-auto) + selected_agent, agents, messages = self._prepare_and_select_agents(last_speaker) + if selected_agent: + return selected_agent + elif self.speaker_selection_method == "manual": + # An agent has not been selected while in manual mode, so move to the next agent + return self.next_agent(last_speaker) + + # auto speaker selection with 2-agent chat + return self._auto_select_speaker(last_speaker, selector, messages, agents) + + async def a_select_speaker(self, last_speaker: Agent, selector: ConversableAgent) -> Agent: + """Select the next speaker (with requery), asynchronously.""" + selected_agent, agents, messages = self._prepare_and_select_agents(last_speaker) + if selected_agent: + return selected_agent + elif self.speaker_selection_method == "manual": + # An agent has not been selected while in manual mode, so move to the next agent + return self.next_agent(last_speaker) + + # auto speaker selection with 2-agent chat + return await self.a_auto_select_speaker(last_speaker, selector, messages, agents) + + def _finalize_speaker(self, last_speaker: Agent, final: bool, name: str, agents: Optional[list[Agent]]) -> Agent: + if not final: + # the LLM client is None, thus no reply is generated. Use round robin instead. + return self.next_agent(last_speaker, agents) + + # If exactly one agent is mentioned, use it. 
Otherwise, leave the OAI response unmodified + mentions = self._mentioned_agents(name, agents) + if len(mentions) == 1: + name = next(iter(mentions)) + else: + logger.warning( + f"GroupChat select_speaker failed to resolve the next speaker's name. This is because the speaker selection OAI call returned:\n{name}" + ) + + # Return the result + agent = self.agent_by_name(name) + return agent if agent else self.next_agent(last_speaker, agents) + + def _register_client_from_config(self, agent: Agent, config: dict): + model_client_cls_to_match = config.get("model_client_cls") + if model_client_cls_to_match: + if not self.select_speaker_auto_model_client_cls: + raise ValueError( + "A custom model was detected in the config but no 'model_client_cls' " + "was supplied for registration in GroupChat." + ) + + if isinstance(self.select_speaker_auto_model_client_cls, list): + # Register the first custom model client class matching the name specified in the config + matching_model_cls = [ + client_cls + for client_cls in self.select_speaker_auto_model_client_cls + if client_cls.__name__ == model_client_cls_to_match + ] + if len(set(matching_model_cls)) > 1: + raise RuntimeError( + f"More than one unique 'model_client_cls' with __name__ '{model_client_cls_to_match}'." + ) + if not matching_model_cls: + raise ValueError( + "No model's __name__ matches the model client class " + f"'{model_client_cls_to_match}' specified in select_speaker_auto_llm_config." + ) + select_speaker_auto_model_client_cls = matching_model_cls[0] + else: + # Register the only custom model client + select_speaker_auto_model_client_cls = self.select_speaker_auto_model_client_cls + + agent.register_model_client(select_speaker_auto_model_client_cls) + + def _register_custom_model_clients(self, agent: ConversableAgent): + if not self.select_speaker_auto_llm_config: + return + + config_format_is_list = "config_list" in self.select_speaker_auto_llm_config + if config_format_is_list: + for config in self.select_speaker_auto_llm_config["config_list"]: + self._register_client_from_config(agent, config) + elif not config_format_is_list: + self._register_client_from_config(agent, self.select_speaker_auto_llm_config) + + def _create_internal_agents( + self, agents, max_attempts, messages, validate_speaker_name, selector: Optional[ConversableAgent] = None + ): + checking_agent = ConversableAgent("checking_agent", default_auto_reply=max_attempts) + + # Register the speaker validation function with the checking agent + checking_agent.register_reply( + [ConversableAgent, None], + reply_func=validate_speaker_name, # Validate each response + remove_other_reply_funcs=True, + ) + + # Override the selector's config if one was passed as a parameter to this class + speaker_selection_llm_config = self.select_speaker_auto_llm_config or selector.llm_config + + if speaker_selection_llm_config is False: + raise ValueError( + "The group chat's internal speaker selection agent does not have an LLM configuration. Please provide a valid LLM config to the group chat's GroupChatManager or set it with the select_speaker_auto_llm_config parameter." 
+ ) + + # Agent for selecting a single agent name from the response + speaker_selection_agent = ConversableAgent( + "speaker_selection_agent", + system_message=self.select_speaker_msg(agents), + chat_messages={checking_agent: messages}, + llm_config=speaker_selection_llm_config, + human_input_mode="NEVER", + # Suppresses some extra terminal outputs, outputs will be handled by select_speaker_auto_verbose + ) + + # Register any custom model passed in select_speaker_auto_llm_config with the speaker_selection_agent + self._register_custom_model_clients(speaker_selection_agent) + + return checking_agent, speaker_selection_agent + + def _auto_select_speaker( + self, + last_speaker: Agent, + selector: ConversableAgent, + messages: Optional[list[dict[str, Any]]], + agents: Optional[list[Agent]], + ) -> Agent: + """Selects next speaker for the "auto" speaker selection method. Utilises its own two-agent chat to determine the next speaker and supports requerying. + + Speaker selection for "auto" speaker selection method: + 1. Create a two-agent chat with a speaker selector agent and a speaker validator agent, like a nested chat + 2. Inject the group messages into the new chat + 3. Run the two-agent chat, evaluating the result of response from the speaker selector agent: + - If a single agent is provided then we return it and finish. If not, we add an additional message to this nested chat in an attempt to guide the LLM to a single agent response + 4. Chat continues until a single agent is nominated or there are no more attempts left + 5. If we run out of turns and no single agent can be determined, the next speaker in the list of agents is returned + + Args: + last_speaker: The previous speaker in the group chat + selector: The ConversableAgent that initiated the speaker selection + messages: Current chat messages + agents: Valid list of agents for speaker selection + + Returns: + A counter for mentioned agents. + """ + # If no agents are passed in, assign all the group chat's agents + if agents is None: + agents = self.agents + + # The maximum number of speaker selection attempts (including requeries) + # is the initial speaker selection attempt plus the maximum number of retries. + # We track these and use them in the validation function as we can't + # access the max_turns from within validate_speaker_name. 
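+        # Illustrative arithmetic (not part of the original logic): with the default
+        # max_retries_for_selecting_speaker=2, max_attempts below evaluates to 3, and the nested
+        # selection chat further down is capped at max_turns=2 * max(1, 3) = 6, i.e. one
+        # exchange per attempt between the checking agent and the speaker selection agent.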
+ max_attempts = 1 + self.max_retries_for_selecting_speaker + attempts_left = max_attempts + attempt = 0 + + # Registered reply function for checking_agent, checks the result of the response for agent names + def validate_speaker_name( + recipient, messages, sender, config + ) -> tuple[bool, Optional[Union[str, dict[str, Any]]]]: + # The number of retries left, starting at max_retries_for_selecting_speaker + nonlocal attempts_left + nonlocal attempt + + attempt = attempt + 1 + attempts_left = attempts_left - 1 + + return self._validate_speaker_name(recipient, messages, sender, config, attempts_left, attempt, agents) + + # Two-agent chat for speaker selection + + # Agent for checking the response from the speaker_select_agent + checking_agent, speaker_selection_agent = self._create_internal_agents( + agents, max_attempts, messages, validate_speaker_name, selector + ) + + # Create the starting message + if self.select_speaker_prompt_template is not None: + start_message = { + "content": self.select_speaker_prompt(agents), + "name": "checking_agent", + "override_role": self.role_for_select_speaker_messages, + } + else: + start_message = messages[-1] + + # Add the message transforms, if any, to the speaker selection agent + if self._speaker_selection_transforms is not None: + self._speaker_selection_transforms.add_to_agent(speaker_selection_agent) + + # Run the speaker selection chat + result = checking_agent.initiate_chat( + speaker_selection_agent, + cache=None, # don't use caching for the speaker selection chat + message=start_message, + max_turns=2 + * max(1, max_attempts), # Limiting the chat to the number of attempts, including the initial one + clear_history=False, + silent=not self.select_speaker_auto_verbose, # Base silence on the verbose attribute + ) + + return self._process_speaker_selection_result(result, last_speaker, agents) + + async def a_auto_select_speaker( + self, + last_speaker: Agent, + selector: ConversableAgent, + messages: Optional[list[dict[str, Any]]], + agents: Optional[list[Agent]], + ) -> Agent: + """(Asynchronous) Selects next speaker for the "auto" speaker selection method. Utilises its own two-agent chat to determine the next speaker and supports requerying. + + Speaker selection for "auto" speaker selection method: + 1. Create a two-agent chat with a speaker selector agent and a speaker validator agent, like a nested chat + 2. Inject the group messages into the new chat + 3. Run the two-agent chat, evaluating the result of response from the speaker selector agent: + - If a single agent is provided then we return it and finish. If not, we add an additional message to this nested chat in an attempt to guide the LLM to a single agent response + 4. Chat continues until a single agent is nominated or there are no more attempts left + 5. If we run out of turns and no single agent can be determined, the next speaker in the list of agents is returned + + Args: + last_speaker: The previous speaker in the group chat + selector: The ConversableAgent that initiated the speaker selection + messages: Current chat messages + agents: Valid list of agents for speaker selection + + Returns: + A counter for mentioned agents. 
+ """ + # If no agents are passed in, assign all the group chat's agents + if agents is None: + agents = self.agents + + # The maximum number of speaker selection attempts (including requeries) + # We track these and use them in the validation function as we can't + # access the max_turns from within validate_speaker_name + max_attempts = 1 + self.max_retries_for_selecting_speaker + attempts_left = max_attempts + attempt = 0 + + # Registered reply function for checking_agent, checks the result of the response for agent names + def validate_speaker_name( + recipient, messages, sender, config + ) -> tuple[bool, Optional[Union[str, dict[str, Any]]]]: + # The number of retries left, starting at max_retries_for_selecting_speaker + nonlocal attempts_left + nonlocal attempt + + attempt = attempt + 1 + attempts_left = attempts_left - 1 + + return self._validate_speaker_name(recipient, messages, sender, config, attempts_left, attempt, agents) + + # Two-agent chat for speaker selection + + # Agent for checking the response from the speaker_select_agent + checking_agent, speaker_selection_agent = self._create_internal_agents( + agents, max_attempts, messages, validate_speaker_name, selector + ) + + # Create the starting message + if self.select_speaker_prompt_template is not None: + start_message = { + "content": self.select_speaker_prompt(agents), + "override_role": self.role_for_select_speaker_messages, + } + else: + start_message = messages[-1] + + # Add the message transforms, if any, to the speaker selection agent + if self._speaker_selection_transforms is not None: + self._speaker_selection_transforms.add_to_agent(speaker_selection_agent) + + # Run the speaker selection chat + result = await checking_agent.a_initiate_chat( + speaker_selection_agent, + cache=None, # don't use caching for the speaker selection chat + message=start_message, + max_turns=2 + * max(1, max_attempts), # Limiting the chat to the number of attempts, including the initial one + clear_history=False, + silent=not self.select_speaker_auto_verbose, # Base silence on the verbose attribute + ) + + return self._process_speaker_selection_result(result, last_speaker, agents) + + def _validate_speaker_name( + self, recipient, messages, sender, config, attempts_left, attempt, agents + ) -> tuple[bool, Optional[Union[str, dict[str, Any]]]]: + """Validates the speaker response for each round in the internal 2-agent + chat within the auto select speaker method. + + Used by auto_select_speaker and a_auto_select_speaker. 
+ """ + # Validate the speaker name selected + select_name = messages[-1]["content"].strip() + + mentions = self._mentioned_agents(select_name, agents) + + # Output the query and requery results + if self.select_speaker_auto_verbose: + iostream = IOStream.get_default() + no_of_mentions = len(mentions) + if no_of_mentions == 1: + # Success on retry, we have just one name mentioned + iostream.send( + SpeakerAttemptSuccessfulEvent( + mentions=mentions, + attempt=attempt, + attempts_left=attempts_left, + select_speaker_auto_verbose=self.select_speaker_auto_verbose, + ) + ) + elif no_of_mentions == 1: + iostream.send( + SpeakerAttemptFailedMultipleAgentsEvent( + mentions=mentions, + attempt=attempt, + attempts_left=attempts_left, + select_speaker_auto_verbose=self.select_speaker_auto_verbose, + ) + ) + else: + iostream.send( + SpeakerAttemptFailedNoAgentsEvent( + mentions=mentions, + attempt=attempt, + attempts_left=attempts_left, + select_speaker_auto_verbose=self.select_speaker_auto_verbose, + ) + ) + + if len(mentions) == 1: + # Success on retry, we have just one name mentioned + selected_agent_name = next(iter(mentions)) + + # Add the selected agent to the response so we can return it + messages.append({"role": "user", "content": f"[AGENT SELECTED]{selected_agent_name}"}) + + elif len(mentions) > 1: + # More than one name on requery so add additional reminder prompt for next retry + + if attempts_left: + # Message to return to the chat for the next attempt + agentlist = f"{[agent.name for agent in agents]}" + + return True, { + "content": self.select_speaker_auto_multiple_template.format(agentlist=agentlist), + "name": "checking_agent", + "override_role": self.role_for_select_speaker_messages, + } + else: + # Final failure, no attempts left + messages.append({ + "role": "user", + "content": f"[AGENT SELECTION FAILED]Select speaker attempt #{attempt} of {attempt + attempts_left} failed as it returned multiple names.", + }) + + else: + # No names at all on requery so add additional reminder prompt for next retry + + if attempts_left: + # Message to return to the chat for the next attempt + agentlist = f"{[agent.name for agent in agents]}" + + return True, { + "content": self.select_speaker_auto_none_template.format(agentlist=agentlist), + "name": "checking_agent", + "override_role": self.role_for_select_speaker_messages, + } + else: + # Final failure, no attempts left + messages.append({ + "role": "user", + "content": f"[AGENT SELECTION FAILED]Select speaker attempt #{attempt} of {attempt + attempts_left} failed as it did not include any agent names.", + }) + + return True, None + + def _process_speaker_selection_result(self, result, last_speaker: ConversableAgent, agents: Optional[list[Agent]]): + """Checks the result of the auto_select_speaker function, returning the + agent to speak. + + Used by auto_select_speaker and a_auto_select_speaker. 
+ """ + if len(result.chat_history) > 0: + # Use the final message, which will have the selected agent or reason for failure + final_message = result.chat_history[-1]["content"] + + if "[AGENT SELECTED]" in final_message: + # Have successfully selected an agent, return it + return self.agent_by_name(final_message.replace("[AGENT SELECTED]", "")) + + else: # "[AGENT SELECTION FAILED]" + # Failed to select an agent, so we'll select the next agent in the list + next_agent = self.next_agent(last_speaker, agents) + + # No agent, return the failed reason + return next_agent + + def _participant_roles(self, agents: list[Agent] = None) -> str: + # Default to all agents registered + if agents is None: + agents = self.agents + + roles = [] + for agent in agents: + if agent.description.strip() == "": + logger.warning( + f"The agent '{agent.name}' has an empty description, and may not work well with GroupChat." + ) + roles.append(f"{agent.name}: {agent.description}".strip()) + return "\n".join(roles) + + def _mentioned_agents(self, message_content: Union[str, list], agents: Optional[list[Agent]]) -> dict: + """Counts the number of times each agent is mentioned in the provided message content. + Agent names will match under any of the following conditions (all case-sensitive): + - Exact name match + - If the agent name has underscores it will match with spaces instead (e.g. 'Story_writer' == 'Story writer') + - If the agent name has underscores it will match with '\\_' instead of '_' (e.g. 'Story_writer' == 'Story\\_writer') + + Args: + message_content (Union[str, List]): The content of the message, either as a single string or a list of strings. + agents (List[Agent]): A list of Agent objects, each having a 'name' attribute to be searched in the message content. + + Returns: + Dict: a counter for mentioned agents. + """ + if agents is None: + agents = self.agents + + # Cast message content to str + if isinstance(message_content, dict): + message_content = message_content["content"] + message_content = content_str(message_content) + + mentions = dict() + for agent in agents: + # Finds agent mentions, taking word boundaries into account, + # accommodates escaping underscores and underscores as spaces + regex = ( + r"(?<=\W)(" + + re.escape(agent.name) + + r"|" + + re.escape(agent.name.replace("_", " ")) + + r"|" + + re.escape(agent.name.replace("_", r"\_")) + + r")(?=\W)" + ) + count = len(re.findall(regex, f" {message_content} ")) # Pad the message to help with matching + if count > 0: + mentions[agent.name] = count + return mentions + + +@export_module("autogen") +class GroupChatManager(ConversableAgent): + """(In preview) A chat manager agent that can manage a group chat of multiple agents.""" + + def __init__( + self, + groupchat: GroupChat, + name: Optional[str] = "chat_manager", + # unlimited consecutive auto reply by default + max_consecutive_auto_reply: Optional[int] = sys.maxsize, + human_input_mode: Literal["ALWAYS", "NEVER", "TERMINATE"] = "NEVER", + system_message: Optional[Union[str, list]] = "Group chat manager.", + silent: bool = False, + **kwargs: Any, + ): + if ( + kwargs.get("llm_config") + and isinstance(kwargs["llm_config"], dict) + and (kwargs["llm_config"].get("functions") or kwargs["llm_config"].get("tools")) + ): + raise ValueError( + "GroupChatManager is not allowed to make function/tool calls. Please remove the 'functions' or 'tools' config in 'llm_config' you passed in." 
+ ) + + super().__init__( + name=name, + max_consecutive_auto_reply=max_consecutive_auto_reply, + human_input_mode=human_input_mode, + system_message=system_message, + **kwargs, + ) + if logging_enabled(): + log_new_agent(self, locals()) + # Store groupchat + self._groupchat = groupchat + + self._last_speaker = None + self._silent = silent + + # Order of register_reply is important. + # Allow sync chat if initiated using initiate_chat + self.register_reply(Agent, GroupChatManager.run_chat, config=groupchat, reset_config=GroupChat.reset) + # Allow async chat if initiated using a_initiate_chat + self.register_reply( + Agent, + GroupChatManager.a_run_chat, + config=groupchat, + reset_config=GroupChat.reset, + ignore_async_in_sync_chat=True, + ) + + @property + def groupchat(self) -> GroupChat: + """Returns the group chat managed by the group chat manager.""" + return self._groupchat + + def chat_messages_for_summary(self, agent: Agent) -> list[dict[str, Any]]: + """The list of messages in the group chat as a conversation to summarize. + The agent is ignored. + """ + return self._groupchat.messages + + def _prepare_chat( + self, + recipient: ConversableAgent, + clear_history: bool, + prepare_recipient: bool = True, + reply_at_receive: bool = True, + ) -> None: + super()._prepare_chat(recipient, clear_history, prepare_recipient, reply_at_receive) + + if clear_history: + self._groupchat.reset() + + for agent in self._groupchat.agents: + if (recipient != agent or prepare_recipient) and isinstance(agent, ConversableAgent): + agent._prepare_chat(self, clear_history, False, reply_at_receive) + + @property + def last_speaker(self) -> Agent: + """Return the agent who sent the last message to group chat manager. + + In a group chat, an agent will always send a message to the group chat manager, and the group chat manager will + send the message to all other agents in the group chat. So, when an agent receives a message, it will always be + from the group chat manager. With this property, the agent receiving the message can know who actually sent the + message. 
+ + Example: + ```python + from autogen import ConversableAgent + from autogen import GroupChat, GroupChatManager + + + def print_messages(recipient, messages, sender, config): + # Print the message immediately + print(f"Sender: {sender.name} | Recipient: {recipient.name} | Message: {messages[-1].get('content')}") + print(f"Real Sender: {sender.last_speaker.name}") + assert sender.last_speaker.name in messages[-1].get("content") + return False, None # Required to ensure the agent communication flow continues + + + agent_a = ConversableAgent("agent A", default_auto_reply="I'm agent A.") + agent_b = ConversableAgent("agent B", default_auto_reply="I'm agent B.") + agent_c = ConversableAgent("agent C", default_auto_reply="I'm agent C.") + for agent in [agent_a, agent_b, agent_c]: + agent.register_reply([ConversableAgent, None], reply_func=print_messages, config=None) + group_chat = GroupChat( + [agent_a, agent_b, agent_c], + messages=[], + max_round=6, + speaker_selection_method="random", + allow_repeat_speaker=True, + ) + chat_manager = GroupChatManager(group_chat) + groupchat_result = agent_a.initiate_chat(chat_manager, message="Hi, there, I'm agent A.") + ``` + """ + return self._last_speaker + + def run_chat( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[GroupChat] = None, + ) -> tuple[bool, Optional[str]]: + """Run a group chat.""" + iostream = IOStream.get_default() + + if messages is None: + messages = self._oai_messages[sender] + message = messages[-1] + speaker = sender + groupchat = config + send_introductions = getattr(groupchat, "send_introductions", False) + silent = getattr(self, "_silent", False) + termination_reason = None + + if send_introductions: + # Broadcast the intro + intro = groupchat.introductions_msg() + for agent in groupchat.agents: + self.send(intro, agent, request_reply=False, silent=True) + # NOTE: We do not also append to groupchat.messages, + # since groupchat handles its own introductions + + if self.client_cache is not None: + for a in groupchat.agents: + a.previous_cache = a.client_cache + a.client_cache = self.client_cache + for i in range(groupchat.max_round): + self._last_speaker = speaker + groupchat.append(message, speaker) + # broadcast the message to all agents except the speaker + for agent in groupchat.agents: + if agent != speaker: + self.send(message, agent, request_reply=False, silent=True) + if self._is_termination_msg(message): + # The conversation is over + termination_reason = f"Termination message condition on the GroupChatManager '{self.name}' met" + break + elif i == groupchat.max_round - 1: + # It's the last round + termination_reason = f"Maximum rounds ({groupchat.max_round}) reached" + break + try: + # select the next speaker + speaker = groupchat.select_speaker(speaker, self) + if not silent: + iostream = IOStream.get_default() + iostream.send(GroupChatRunChatEvent(speaker=speaker, silent=silent)) + # let the speaker speak + reply = speaker.generate_reply(sender=self) + except KeyboardInterrupt: + # let the admin agent speak if interrupted + if groupchat.admin_name in groupchat.agent_names: + # admin agent is one of the participants + speaker = groupchat.agent_by_name(groupchat.admin_name) + reply = speaker.generate_reply(sender=self) + else: + # admin agent is not found in the participants + raise + except NoEligibleSpeakerError: + # No eligible speaker, terminate the conversation + termination_reason = "No next speaker selected" + break + + if reply is None: + # no 
reply is generated, exit the chat + termination_reason = "No reply generated" + break + + # check for "clear history" phrase in reply and activate clear history function if found + if ( + groupchat.enable_clear_history + and isinstance(reply, dict) + and reply["content"] + and "CLEAR HISTORY" in reply["content"].upper() + ): + reply["content"] = self.clear_agents_history(reply, groupchat) + + # The speaker sends the message without requesting a reply + speaker.send(reply, self, request_reply=False, silent=silent) + message = self.last_message(speaker) + if self.client_cache is not None: + for a in groupchat.agents: + a.client_cache = a.previous_cache + a.previous_cache = None + + if termination_reason: + iostream.send(TerminationEvent(termination_reason=termination_reason)) + + return True, None + + async def a_run_chat( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[GroupChat] = None, + ): + """Run a group chat asynchronously.""" + iostream = IOStream.get_default() + + if messages is None: + messages = self._oai_messages[sender] + message = messages[-1] + speaker = sender + groupchat = config + send_introductions = getattr(groupchat, "send_introductions", False) + silent = getattr(self, "_silent", False) + termination_reason = None + + if send_introductions: + # Broadcast the intro + intro = groupchat.introductions_msg() + for agent in groupchat.agents: + await self.a_send(intro, agent, request_reply=False, silent=True) + # NOTE: We do not also append to groupchat.messages, + # since groupchat handles its own introductions + + if self.client_cache is not None: + for a in groupchat.agents: + a.previous_cache = a.client_cache + a.client_cache = self.client_cache + for i in range(groupchat.max_round): + groupchat.append(message, speaker) + self._last_speaker = speaker + + if self._is_termination_msg(message): + # The conversation is over + termination_reason = f"Termination message condition on the GroupChatManager '{self.name}' met" + break + + # broadcast the message to all agents except the speaker + for agent in groupchat.agents: + if agent != speaker: + await self.a_send(message, agent, request_reply=False, silent=True) + if i == groupchat.max_round - 1: + # the last round + termination_reason = f"Maximum rounds ({groupchat.max_round}) reached" + break + try: + # select the next speaker + speaker = await groupchat.a_select_speaker(speaker, self) + # let the speaker speak + reply = await speaker.a_generate_reply(sender=self) + except KeyboardInterrupt: + # let the admin agent speak if interrupted + if groupchat.admin_name in groupchat.agent_names: + # admin agent is one of the participants + speaker = groupchat.agent_by_name(groupchat.admin_name) + reply = await speaker.a_generate_reply(sender=self) + else: + # admin agent is not found in the participants + raise + except NoEligibleSpeakerError: + # No eligible speaker, terminate the conversation + termination_reason = "No next speaker selected" + break + + if reply is None: + # no reply is generated, exit the chat + termination_reason = "No reply generated" + break + + # The speaker sends the message without requesting a reply + await speaker.a_send(reply, self, request_reply=False, silent=silent) + message = self.last_message(speaker) + if self.client_cache is not None: + for a in groupchat.agents: + a.client_cache = a.previous_cache + a.previous_cache = None + + if termination_reason: + iostream.send(TerminationEvent(termination_reason=termination_reason)) + + return 
True, None + + def resume( + self, + messages: Union[list[dict[str, Any]], str], + remove_termination_string: Optional[Union[str, Callable[[str], str]]] = None, + silent: Optional[bool] = False, + ) -> tuple[ConversableAgent, dict[str, Any]]: + """Resumes a group chat using the previous messages as a starting point. Requires the agents, group chat, and group chat manager to be established + as per the original group chat. + + Args: + messages: The content of the previous chat's messages, either as a Json string or a list of message dictionaries. + remove_termination_string: Remove the termination string from the last message to prevent immediate termination + If a string is provided, this string will be removed from last message. + If a function is provided, the last message will be passed to this function. + silent: (Experimental) whether to print the messages for this conversation. Default is False. + + Returns: + A tuple containing the last agent who spoke and their message + """ + # Convert messages from string to messages list, if needed + if isinstance(messages, str): + messages = self.messages_from_string(messages) + elif isinstance(messages, list) and all(isinstance(item, dict) for item in messages): + messages = copy.deepcopy(messages) + else: + raise Exception("Messages is not of type str or List[Dict]") + + # Clean up the objects, ensuring there are no messages in the agents and group chat + + # Clear agent message history + for agent in self._groupchat.agents: + if isinstance(agent, ConversableAgent): + agent.clear_history() + + # Clear Manager message history + self.clear_history() + + # Clear GroupChat messages + self._groupchat.reset() + + # Validation of message and agents + + try: + self._valid_resume_messages(messages) + except: + raise + + # Load the messages into the group chat + for i, message in enumerate(messages): + if "name" in message: + message_speaker_agent = self._groupchat.agent_by_name(message["name"]) + else: + # If there's no name, assign the group chat manager (this is an indication the ChatResult messages was used instead of groupchat.messages as state) + message_speaker_agent = self + message["name"] = self.name + + # If it wasn't an agent speaking, it may be the manager + if not message_speaker_agent and message["name"] == self.name: + message_speaker_agent = self + + # Add previous messages to each agent (except the last message, as we'll kick off the conversation with it) + if i != len(messages) - 1: + for agent in self._groupchat.agents: + if agent.name == message["name"]: + # An agent`s message is sent to the Group Chat Manager + agent.send(message, self, request_reply=False, silent=True) + else: + # Otherwise, messages are sent from the Group Chat Manager to the agent + self.send(message, agent, request_reply=False, silent=True) + + # Add previous message to the new groupchat, if it's an admin message the name may not match so add the message directly + if message_speaker_agent: + self._groupchat.append(message, message_speaker_agent) + else: + self._groupchat.messages.append(message) + + # Last speaker agent + last_speaker_name = message["name"] + + # Last message to check for termination (we could avoid this by ignoring termination check for resume in the future) + last_message = message + + # Get last speaker as an agent + previous_last_agent = self._groupchat.agent_by_name(name=last_speaker_name) + + # If we didn't match a last speaker agent, we check that it's the group chat's admin name and assign the manager, if so + if not 
previous_last_agent and ( + last_speaker_name == self._groupchat.admin_name or last_speaker_name == self.name + ): + previous_last_agent = self + + # Termination removal and check + self._process_resume_termination(remove_termination_string, messages) + + if not silent: + iostream = IOStream.get_default() + iostream.send(GroupChatResumeEvent(last_speaker_name=last_speaker_name, events=messages, silent=silent)) + + # Update group chat settings for resuming + self._groupchat.send_introductions = False + + return previous_last_agent, last_message + + async def a_resume( + self, + messages: Union[list[dict[str, Any]], str], + remove_termination_string: Optional[Union[str, Callable[[str], str]]] = None, + silent: Optional[bool] = False, + ) -> tuple[ConversableAgent, dict[str, Any]]: + """Resumes a group chat using the previous messages as a starting point, asynchronously. Requires the agents, group chat, and group chat manager to be established + as per the original group chat. + + Args: + messages: The content of the previous chat's messages, either as a Json string or a list of message dictionaries. + remove_termination_string: Remove the termination string from the last message to prevent immediate termination + If a string is provided, this string will be removed from last message. + If a function is provided, the last message will be passed to this function, and the function returns the string after processing. + silent: (Experimental) whether to print the messages for this conversation. Default is False. + + Returns: + A tuple containing the last agent who spoke and their message + """ + # Convert messages from string to messages list, if needed + if isinstance(messages, str): + messages = self.messages_from_string(messages) + elif isinstance(messages, list) and all(isinstance(item, dict) for item in messages): + messages = copy.deepcopy(messages) + else: + raise Exception("Messages is not of type str or List[Dict]") + + # Clean up the objects, ensuring there are no messages in the agents and group chat + + # Clear agent message history + for agent in self._groupchat.agents: + if isinstance(agent, ConversableAgent): + agent.clear_history() + + # Clear Manager message history + self.clear_history() + + # Clear GroupChat messages + self._groupchat.reset() + + # Validation of message and agents + + try: + self._valid_resume_messages(messages) + except: + raise + + # Load the messages into the group chat + for i, message in enumerate(messages): + if "name" in message: + message_speaker_agent = self._groupchat.agent_by_name(message["name"]) + else: + # If there's no name, assign the group chat manager (this is an indication the ChatResult messages was used instead of groupchat.messages as state) + message_speaker_agent = self + message["name"] = self.name + + # If it wasn't an agent speaking, it may be the manager + if not message_speaker_agent and message["name"] == self.name: + message_speaker_agent = self + + # Add previous messages to each agent (except the last message, as we'll kick off the conversation with it) + if i != len(messages) - 1: + for agent in self._groupchat.agents: + if agent.name == message["name"]: + # An agent`s message is sent to the Group Chat Manager + await agent.a_send(message, self, request_reply=False, silent=True) + else: + # Otherwise, messages are sent from the Group Chat Manager to the agent + await self.a_send(message, agent, request_reply=False, silent=True) + + # Add previous message to the new groupchat, if it's an admin message the name may not match so 
add the message directly + if message_speaker_agent: + self._groupchat.append(message, message_speaker_agent) + else: + self._groupchat.messages.append(message) + + # Last speaker agent + last_speaker_name = message["name"] + + # Last message to check for termination (we could avoid this by ignoring termination check for resume in the future) + last_message = message + + # Get last speaker as an agent + previous_last_agent = self._groupchat.agent_by_name(name=last_speaker_name) + + # If we didn't match a last speaker agent, we check that it's the group chat's admin name and assign the manager, if so + if not previous_last_agent and ( + last_speaker_name == self._groupchat.admin_name or last_speaker_name == self.name + ): + previous_last_agent = self + + # Termination removal and check + self._process_resume_termination(remove_termination_string, messages) + + if not silent: + iostream = IOStream.get_default() + iostream.send(GroupChatResumeEvent(last_speaker_name=last_speaker_name, events=messages, silent=silent)) + + # Update group chat settings for resuming + self._groupchat.send_introductions = False + + return previous_last_agent, last_message + + def _valid_resume_messages(self, messages: list[dict[str, Any]]): + """Validates the messages used for resuming + + Args: + messages (List[Dict]): list of messages to resume with + + Returns: + - bool: Whether they are valid for resuming + """ + # Must have messages to start with, otherwise they should run run_chat + if not messages: + raise Exception( + "Cannot resume group chat as no messages were provided. Use GroupChatManager.run_chat or ConversableAgent.initiate_chat to start a new chat." + ) + + # Check that all agents in the chat messages exist in the group chat + for message in messages: + if message.get("name") and ( + not self._groupchat.agent_by_name(message["name"]) + and not message["name"] == self._groupchat.admin_name # ignore group chat's name + and not message["name"] == self.name # ignore group chat manager's name + ): + raise Exception(f"Agent name in message doesn't exist as agent in group chat: {message['name']}") + + def _process_resume_termination( + self, remove_termination_string: Union[str, Callable[[str], str]], messages: list[dict[str, Any]] + ): + """Removes termination string, if required, and checks if termination may occur. + + Args: + remove_termination_string: Remove the termination string from the last message to prevent immediate termination + If a string is provided, this string will be removed from last message. + If a function is provided, the last message will be passed to this function, and the function returns the string after processing. 
+            messages: List of chat messages
+
+        Returns:
+            None
+        """
+        last_message = messages[-1]
+
+        # Replace any given termination string in the last message
+        if isinstance(remove_termination_string, str):
+
+            def _remove_termination_string(content: str) -> str:
+                return content.replace(remove_termination_string, "")
+
+        else:
+            _remove_termination_string = remove_termination_string
+
+        if _remove_termination_string and messages[-1].get("content"):
+            messages[-1]["content"] = _remove_termination_string(messages[-1]["content"])
+
+        # Check if the last message meets termination (if it has one)
+        if self._is_termination_msg and self._is_termination_msg(last_message):
+            logger.warning("WARNING: Last message meets termination criteria and this may terminate the chat.")
+
+    def messages_from_string(self, message_string: str) -> list[dict[str, Any]]:
+        """Reads the saved state of messages in Json format for resume and returns as a messages list
+
+        Args:
+            message_string: Json string, the saved state
+
+        Returns:
+            A list of messages
+        """
+        try:
+            state = json.loads(message_string)
+        except json.JSONDecodeError:
+            raise Exception("Messages string is not a valid JSON string")
+
+        return state
+
+    def messages_to_string(self, messages: list[dict[str, Any]]) -> str:
+        """Converts the provided messages into a Json string that can be used for resuming the chat.
+        The state is made up of a list of messages
+
+        Args:
+            messages: set of messages to convert to a string
+
+        Returns:
+            A JSON representation of the messages which can be persisted for resuming later
+        """
+        return json.dumps(messages)
+
+    def _raise_exception_on_async_reply_functions(self) -> None:
+        """Raise an exception if any async reply functions are registered.
+
+        Raises:
+            RuntimeError: if any async reply functions are registered.
+        """
+        super()._raise_exception_on_async_reply_functions()
+
+        for agent in self._groupchat.agents:
+            agent._raise_exception_on_async_reply_functions()
+
+    def clear_agents_history(self, reply: dict[str, Any], groupchat: GroupChat) -> str:
+        """Clears history of messages for all agents or a selected one. Can preserve a selected number of last messages.
+        This function is called when the user manually provides the "clear history" phrase in their reply.
+        When "clear history" is provided, the history of messages for all agents is cleared.
+        When "clear history `<agent_name>`" is provided, the history of messages for the selected agent is cleared.
+        When "clear history `<nr_of_messages_to_preserve>`" is provided, the history of messages for all agents is cleared
+        except the last `<nr_of_messages_to_preserve>` messages.
+        When "clear history `<agent_name>` `<nr_of_messages_to_preserve>`" is provided, the history of messages for the selected
+        agent is cleared except the last `<nr_of_messages_to_preserve>` messages.
+        The "clear history" phrase and its optional arguments are cut out of the reply before it is passed to the chat.
+
+        Args:
+            reply (dict): reply message dict to analyze.
+            groupchat (GroupChat): GroupChat object.
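+
+        Example (illustrative; the agent name is hypothetical):
+            A reply containing "clear history Coder 2" clears the history of the agent named
+            "Coder" except for its last 2 messages, and the phrase and its arguments are removed
+            from the reply content that is returned.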
+ """ + iostream = IOStream.get_default() + + reply_content = reply["content"] + # Split the reply into words + words = reply_content.split() + # Find the position of "clear" to determine where to start processing + clear_word_index = next(i for i in reversed(range(len(words))) if words[i].upper() == "CLEAR") + # Extract potential agent name and steps + words_to_check = words[clear_word_index + 2 : clear_word_index + 4] + nr_messages_to_preserve = None + nr_messages_to_preserve_provided = False + agent_to_memory_clear = None + + for word in words_to_check: + if word.isdigit(): + nr_messages_to_preserve = int(word) + nr_messages_to_preserve_provided = True + elif word[:-1].isdigit(): # for the case when number of messages is followed by dot or other sign + nr_messages_to_preserve = int(word[:-1]) + nr_messages_to_preserve_provided = True + else: + for agent in groupchat.agents: + if agent.name == word or agent.name == word[:-1]: + agent_to_memory_clear = agent + break + # preserve last tool call message if clear history called inside of tool response + if "tool_responses" in reply and not nr_messages_to_preserve: + nr_messages_to_preserve = 1 + logger.warning( + "The last tool call message will be saved to prevent errors caused by tool response without tool call." + ) + # clear history + iostream.send( + ClearAgentsHistoryEvent(agent=agent_to_memory_clear, nr_events_to_preserve=nr_messages_to_preserve) + ) + if agent_to_memory_clear: + agent_to_memory_clear.clear_history(nr_messages_to_preserve=nr_messages_to_preserve) + else: + if nr_messages_to_preserve: + # clearing history for groupchat here + temp = groupchat.messages[-nr_messages_to_preserve:] + groupchat.messages.clear() + groupchat.messages.extend(temp) + else: + # clearing history for groupchat here + groupchat.messages.clear() + # clearing history for agents + for agent in groupchat.agents: + agent.clear_history(nr_messages_to_preserve=nr_messages_to_preserve) + + # Reconstruct the reply without the "clear history" command and parameters + skip_words_number = 2 + int(bool(agent_to_memory_clear)) + int(nr_messages_to_preserve_provided) + reply_content = " ".join(words[:clear_word_index] + words[clear_word_index + skip_words_number :]) + + return reply_content diff --git a/mm_agents/coact/autogen/agentchat/realtime/__init__.py b/mm_agents/coact/autogen/agentchat/realtime/__init__.py new file mode 100644 index 0000000..1cce1a2 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/__init__.py @@ -0,0 +1,3 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/__init__.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/__init__.py new file mode 100644 index 0000000..1561d7f --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/__init__.py @@ -0,0 +1,20 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from .audio_adapters import TwilioAudioAdapter, WebSocketAudioAdapter +from .audio_observer import AudioObserver +from .function_observer import FunctionObserver +from .realtime_agent import RealtimeAgent +from .realtime_observer import RealtimeObserver +from .realtime_swarm import register_swarm + +__all__ = [ + "AudioObserver", + "FunctionObserver", + "RealtimeAgent", + "RealtimeObserver", + "TwilioAudioAdapter", + 
"WebSocketAudioAdapter", + "register_swarm", +] diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/audio_adapters/__init__.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/audio_adapters/__init__.py new file mode 100644 index 0000000..90d269c --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/audio_adapters/__init__.py @@ -0,0 +1,8 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from .twilio_audio_adapter import TwilioAudioAdapter +from .websocket_audio_adapter import WebSocketAudioAdapter + +__all__ = ["TwilioAudioAdapter", "WebSocketAudioAdapter"] diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/audio_adapters/twilio_audio_adapter.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/audio_adapters/twilio_audio_adapter.py new file mode 100644 index 0000000..592b6a0 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/audio_adapters/twilio_audio_adapter.py @@ -0,0 +1,148 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +import base64 +import json +from logging import Logger +from typing import TYPE_CHECKING, Optional + +from .....doc_utils import export_module +from ..realtime_events import AudioDelta, RealtimeEvent, SpeechStarted +from ..realtime_observer import RealtimeObserver + +if TYPE_CHECKING: + from ..websockets import WebSocketProtocol as WebSocket + + +LOG_EVENT_TYPES = [ + "error", + "response.content.done", + "rate_limits.updated", + "response.done", + "input_audio_buffer.committed", + "input_audio_buffer.speech_stopped", + "input_audio_buffer.speech_started", + "session.created", +] +SHOW_TIMING_MATH = False + + +@export_module("autogen.agentchat.realtime.experimental") +class TwilioAudioAdapter(RealtimeObserver): + """Adapter for streaming audio from Twilio to OpenAI Realtime API and vice versa.""" + + def __init__(self, websocket: "WebSocket", *, logger: Optional[Logger] = None): + """Adapter for streaming audio from Twilio to OpenAI Realtime API and vice versa. + + Args: + websocket: the websocket connection to the Twilio service + logger: the logger to use for logging events + """ + super().__init__(logger=logger) + self.websocket = websocket + + # Connection specific state + self.stream_sid = None + self.latest_media_timestamp = 0 + self.last_assistant_item: Optional[str] = None + self.mark_queue: list[str] = [] + self.response_start_timestamp_twilio: Optional[int] = None + + async def on_event(self, event: RealtimeEvent) -> None: + """Receive events from the OpenAI Realtime API, send audio back to Twilio.""" + logger = self.logger + + if isinstance(event, AudioDelta): + audio_payload = base64.b64encode(base64.b64decode(event.delta)).decode("utf-8") + audio_delta = {"event": "media", "streamSid": self.stream_sid, "media": {"payload": audio_payload}} + await self.websocket.send_json(audio_delta) + + if self.response_start_timestamp_twilio is None: + self.response_start_timestamp_twilio = self.latest_media_timestamp + if SHOW_TIMING_MATH: + logger.info(f"Setting start timestamp for new response: {self.response_start_timestamp_twilio}ms") + + # Update last_assistant_item safely + if event.item_id: + self.last_assistant_item = event.item_id + + await self.send_mark() + + # Trigger an interruption. 
Your use case might work better using `input_audio_buffer.speech_stopped`, or combining the two. + if isinstance(event, SpeechStarted): + logger.info("Speech start detected.") + if self.last_assistant_item: + logger.info(f"Interrupting response with id: {self.last_assistant_item}") + await self.handle_speech_started_event() + + async def handle_speech_started_event(self) -> None: + """Handle interruption when the caller's speech starts.""" + logger = self.logger + + logger.info("Handling speech started event.") + if self.mark_queue and self.response_start_timestamp_twilio is not None: + elapsed_time = self.latest_media_timestamp - self.response_start_timestamp_twilio + if SHOW_TIMING_MATH: + logger.info( + f"Calculating elapsed time for truncation: {self.latest_media_timestamp} - {self.response_start_timestamp_twilio} = {elapsed_time}ms" + ) + + if self.last_assistant_item: + if SHOW_TIMING_MATH: + logger.info(f"Truncating item with ID: {self.last_assistant_item}, Truncated at: {elapsed_time}ms") + + await self.realtime_client.truncate_audio( + audio_end_ms=elapsed_time, + content_index=0, + item_id=self.last_assistant_item, + ) + + await self.websocket.send_json({"event": "clear", "streamSid": self.stream_sid}) + + self.mark_queue.clear() + self.last_assistant_item = None + self.response_start_timestamp_twilio = None + + async def send_mark(self) -> None: + """Send a mark of audio interruption to the Twilio websocket.""" + if self.stream_sid: + mark_event = {"event": "mark", "streamSid": self.stream_sid, "mark": {"name": "responsePart"}} + await self.websocket.send_json(mark_event) + self.mark_queue.append("responsePart") + + async def run_loop(self) -> None: + """Run the adapter loop.""" + logger = self.logger + + async for message in self.websocket.iter_text(): + try: + data = json.loads(message) + if data["event"] == "media": + self.latest_media_timestamp = int(data["media"]["timestamp"]) + await self.realtime_client.send_audio(audio=data["media"]["payload"]) + elif data["event"] == "start": + self.stream_sid = data["start"]["streamSid"] + logger.info(f"Incoming stream has started {self.stream_sid}") + self.response_start_timestamp_twilio = None + self.latest_media_timestamp = 0 + self.last_assistant_item = None + elif data["event"] == "mark": + if self.mark_queue: + self.mark_queue.pop(0) + except Exception as e: + logger.warning(f"Error processing Twilio message: {e}", stack_info=True) + + async def initialize_session(self) -> None: + """Control initial session with OpenAI.""" + session_update = { + "input_audio_format": "g711_ulaw", + "output_audio_format": "g711_ulaw", + } + await self.realtime_client.session_update(session_update) + + +if TYPE_CHECKING: + + def twilio_audio_adapter(websocket: "WebSocket") -> RealtimeObserver: + return TwilioAudioAdapter(websocket) diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/audio_adapters/websocket_audio_adapter.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/audio_adapters/websocket_audio_adapter.py new file mode 100644 index 0000000..7f1335f --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/audio_adapters/websocket_audio_adapter.py @@ -0,0 +1,139 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +import base64 +import json +from logging import Logger +from typing import TYPE_CHECKING, Optional + +from .....doc_utils import export_module +from ..realtime_events import AudioDelta, 
RealtimeEvent, SpeechStarted
+from ..realtime_observer import RealtimeObserver
+
+if TYPE_CHECKING:
+    from ..websockets import WebSocketProtocol as WebSocket
+
+LOG_EVENT_TYPES = [
+    "error",
+    "response.content.done",
+    "rate_limits.updated",
+    "response.done",
+    "input_audio_buffer.committed",
+    "input_audio_buffer.speech_stopped",
+    "input_audio_buffer.speech_started",
+    "session.created",
+]
+SHOW_TIMING_MATH = False
+
+
+@export_module("autogen.agentchat.realtime.experimental")
+class WebSocketAudioAdapter(RealtimeObserver):
+    def __init__(self, websocket: "WebSocket", *, logger: Optional[Logger] = None) -> None:
+        """Adapter for streaming audio between a websocket client and the OpenAI Realtime API.
+
+        Args:
+            websocket (WebSocket): The websocket connection.
+            logger (Logger): The logger for the adapter.
+        """
+        super().__init__(logger=logger)
+        self.websocket = websocket
+
+        # Connection specific state
+        self.stream_sid = None
+        self.latest_media_timestamp = 0
+        self.last_assistant_item: Optional[str] = None
+        self.mark_queue: list[str] = []
+        self.response_start_timestamp_socket: Optional[int] = None
+
+    async def on_event(self, event: RealtimeEvent) -> None:
+        """Receive events from the OpenAI Realtime API, send audio back to websocket."""
+        logger = self.logger
+
+        if isinstance(event, AudioDelta):
+            audio_payload = base64.b64encode(base64.b64decode(event.delta)).decode("utf-8")
+            audio_delta = {"event": "media", "streamSid": self.stream_sid, "media": {"payload": audio_payload}}
+            await self.websocket.send_json(audio_delta)
+
+            if self.response_start_timestamp_socket is None:
+                self.response_start_timestamp_socket = self.latest_media_timestamp
+                if SHOW_TIMING_MATH:
+                    logger.info(f"Setting start timestamp for new response: {self.response_start_timestamp_socket}ms")
+
+            # Update last_assistant_item safely
+            if event.item_id:
+                self.last_assistant_item = event.item_id
+
+            await self.send_mark()
+
+        # Trigger an interruption. Your use case might work better using `input_audio_buffer.speech_stopped`, or combining the two.
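+        # When the caller starts speaking, truncate the assistant's in-flight audio at the elapsed playback
+        # time and ask the client to clear its buffered audio (see handle_speech_started_event below).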
+ if isinstance(event, SpeechStarted): + logger.info("Speech start detected.") + if self.last_assistant_item: + logger.info(f"Interrupting response with id: {self.last_assistant_item}") + await self.handle_speech_started_event() + + async def handle_speech_started_event(self) -> None: + """Handle interruption when the caller's speech starts.""" + logger = self.logger + logger.info("Handling speech started event.") + if self.mark_queue and self.response_start_timestamp_socket is not None: + elapsed_time = self.latest_media_timestamp - self.response_start_timestamp_socket + if SHOW_TIMING_MATH: + logger.info( + f"Calculating elapsed time for truncation: {self.latest_media_timestamp} - {self.response_start_timestamp_socket} = {elapsed_time}ms" + ) + + if self.last_assistant_item: + if SHOW_TIMING_MATH: + logger.info(f"Truncating item with ID: {self.last_assistant_item}, Truncated at: {elapsed_time}ms") + + await self.realtime_client.truncate_audio( + audio_end_ms=elapsed_time, + content_index=0, + item_id=self.last_assistant_item, + ) + + await self.websocket.send_json({"event": "clear", "streamSid": self.stream_sid}) + + self.mark_queue.clear() + self.last_assistant_item = None + self.response_start_timestamp_socket = None + + async def send_mark(self) -> None: + if self.stream_sid: + mark_event = {"event": "mark", "streamSid": self.stream_sid, "mark": {"name": "responsePart"}} + await self.websocket.send_json(mark_event) + self.mark_queue.append("responsePart") + + async def initialize_session(self) -> None: + """Control initial session with OpenAI.""" + session_update = {"input_audio_format": "pcm16", "output_audio_format": "pcm16"} + await self.realtime_client.session_update(session_update) + + async def run_loop(self) -> None: + """Reads data from websocket and sends it to the RealtimeClient.""" + logger = self.logger + async for message in self.websocket.iter_text(): + try: + data = json.loads(message) + if data["event"] == "media": + self.latest_media_timestamp = int(data["media"]["timestamp"]) + await self.realtime_client.send_audio(audio=data["media"]["payload"]) + elif data["event"] == "start": + self.stream_sid = data["start"]["streamSid"] + logger.info(f"Incoming stream has started {self.stream_sid}") + self.response_start_timestamp_socket = None + self.latest_media_timestamp = 0 + self.last_assistant_item = None + elif data["event"] == "mark": + if self.mark_queue: + self.mark_queue.pop(0) + except Exception as e: + logger.warning(f"Failed to process message: {e}", stack_info=True) + + +if TYPE_CHECKING: + + def websocket_audio_adapter(websocket: "WebSocket") -> RealtimeObserver: + return WebSocketAudioAdapter(websocket) diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/audio_observer.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/audio_observer.py new file mode 100644 index 0000000..dfa4ca6 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/audio_observer.py @@ -0,0 +1,42 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import TYPE_CHECKING, Optional + +from ....doc_utils import export_module +from .realtime_events import InputAudioBufferDelta, RealtimeEvent +from .realtime_observer import RealtimeObserver + +if TYPE_CHECKING: + from logging import Logger + + +@export_module("autogen.agentchat.realtime.experimental") +class AudioObserver(RealtimeObserver): + """Observer for user voice input""" + + def 
__init__(self, *, logger: Optional["Logger"] = None) -> None: + """Observer for user voice input""" + super().__init__(logger=logger) + + async def on_event(self, event: RealtimeEvent) -> None: + """Observe voice input events from the Realtime. + + Args: + event (dict[str, Any]): The event from the OpenAI Realtime API. + """ + if isinstance(event, InputAudioBufferDelta): + self.logger.info("Received audio buffer delta") + + async def initialize_session(self) -> None: + """No need to initialize session from this observer""" + pass + + async def run_loop(self) -> None: + """Run the observer loop.""" + pass + + +if TYPE_CHECKING: + function_observer: RealtimeObserver = AudioObserver() diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/__init__.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/__init__.py new file mode 100644 index 0000000..23e90a6 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/__init__.py @@ -0,0 +1,15 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from .gemini.client import GeminiRealtimeClient +from .oai.base_client import OpenAIRealtimeClient +from .realtime_client import RealtimeClientProtocol, Role, get_client + +__all__ = [ + "GeminiRealtimeClient", + "OpenAIRealtimeClient", + "RealtimeClientProtocol", + "Role", + "get_client", +] diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/gemini/__init__.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/gemini/__init__.py new file mode 100644 index 0000000..bec9e2c --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/gemini/__init__.py @@ -0,0 +1,7 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from .client import GeminiRealtimeClient + +__all__ = ["GeminiRealtimeClient"] diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/gemini/client.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/gemini/client.py new file mode 100644 index 0000000..fa6a76a --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/gemini/client.py @@ -0,0 +1,274 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +import json +from collections.abc import AsyncGenerator +from contextlib import asynccontextmanager +from logging import Logger, getLogger +from typing import TYPE_CHECKING, Any, Callable, Optional, Union + +from ......doc_utils import export_module +from ......import_utils import optional_import_block, require_optional_import +from ......llm_config import LLMConfig +from ...realtime_events import AudioDelta, FunctionCall, RealtimeEvent, SessionCreated +from ..realtime_client import RealtimeClientBase, Role, register_realtime_client + +with optional_import_block(): + from websockets.asyncio.client import connect + + +if TYPE_CHECKING: + from websockets.asyncio.client import ClientConnection + + from ..realtime_client import RealtimeClientProtocol + +__all__ = ["GeminiRealtimeClient"] + +global_logger = getLogger(__name__) + + +HOST = "generativelanguage.googleapis.com" +API_VERSION = "v1alpha" + + +@register_realtime_client() +@require_optional_import("websockets", "gemini", except_for=["get_factory", "__init__"]) 
+@export_module("autogen.agentchat.realtime.experimental.clients") +class GeminiRealtimeClient(RealtimeClientBase): + """(Experimental) Client for Gemini Realtime API.""" + + def __init__( + self, + *, + llm_config: Union[LLMConfig, dict[str, Any]], + logger: Optional[Logger] = None, + ) -> None: + """(Experimental) Client for Gemini Realtime API. + + Args: + llm_config: The config for the client. + logger: The logger for the client. + """ + super().__init__() + self._llm_config = llm_config + self._logger = logger + + self._connection: Optional["ClientConnection"] = None + config = llm_config["config_list"][0] + + self._model: str = config["model"] + self._voice = config.get("voice", "charon") + self._temperature: float = config.get("temperature", 0.8) # type: ignore[union-attr] + + self._response_modality = "AUDIO" + + self._api_key = config.get("api_key", None) + # todo: add test with base_url just to make sure it works + self._base_url: str = config.get( + "base_url", + f"wss://{HOST}/ws/google.ai.generativelanguage.{API_VERSION}.GenerativeService.BidiGenerateContent?key={self._api_key}", + ) + self._final_config: dict[str, Any] = {} + self._pending_session_updates: dict[str, Any] = {} + self._is_reading_events = False + + @property + def logger(self) -> Logger: + """Get the logger for the Gemini Realtime API.""" + return self._logger or global_logger + + @property + def connection(self) -> "ClientConnection": + """Get the Gemini WebSocket connection.""" + if self._connection is None: + raise RuntimeError("Gemini WebSocket is not initialized") + return self._connection + + async def send_function_result(self, call_id: str, result: str) -> None: + """Send the result of a function call to the Gemini Realtime API. + + Args: + call_id (str): The ID of the function call. + result (str): The result of the function call. + """ + msg = { + "tool_response": {"function_responses": [{"id": call_id, "response": {"result": {"string_value": result}}}]} + } + if self._is_reading_events: + await self.connection.send(json.dumps(msg)) + + async def send_text(self, *, role: Role, text: str, turn_complete: bool = True) -> None: + """Send a text message to the Gemini Realtime API. + + Args: + role: The role of the message. + text: The text of the message. + turn_complete: A flag indicating if the turn is complete. + """ + msg = { + "client_content": { + "turn_complete": turn_complete, + "turns": [{"role": role, "parts": [{"text": text}]}], + } + } + if self._is_reading_events: + await self.connection.send(json.dumps(msg)) + + async def send_audio(self, audio: str) -> None: + """Send audio to the Gemini Realtime API. + + Args: + audio (str): The audio to send. 
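+
+        Note:
+            The chunk is queued locally as an `InputAudioBufferDelta` event for observers, and is
+            forwarded to Gemini as a `realtime_input` media chunk with MIME type `audio/pcm` once the
+            client is reading events.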
+ """ + msg = { + "realtime_input": { + "media_chunks": [ + { + "data": audio, + "mime_type": "audio/pcm", + } + ] + } + } + await self.queue_input_audio_buffer_delta(audio) + if self._is_reading_events: + await self.connection.send(json.dumps(msg)) + + async def truncate_audio(self, audio_end_ms: int, content_index: int, item_id: str) -> None: + self.logger.info("This is not natively supported by Gemini Realtime API.") + pass + + async def _initialize_session(self) -> None: + """Initialize the session with the Gemini Realtime API.""" + session_config = { + "setup": { + "system_instruction": { + "role": "system", + "parts": [{"text": self._pending_session_updates.get("instructions", "")}], + }, + "model": f"models/{self._model}", + "tools": [ + { + "function_declarations": [ + { + "name": tool_schema["name"], + "description": tool_schema["description"], + "parameters": tool_schema["parameters"], + } + for tool_schema in self._pending_session_updates.get("tools", []) + ] + }, + ], + "generation_config": { + "response_modalities": [self._response_modality], + "speech_config": {"voiceConfig": {"prebuiltVoiceConfig": {"voiceName": self._voice}}}, + "temperature": self._temperature, + }, + } + } + + self.logger.info(f"Sending session update: {session_config}") + await self.connection.send(json.dumps(session_config)) + + async def session_update(self, session_options: dict[str, Any]) -> None: + """Record session updates to be applied when the connection is established. + + Args: + session_options (dict[str, Any]): The session options to update. + """ + if self._is_reading_events: + self.logger.warning("Is reading events. Session update will be ignored.") + else: + self._pending_session_updates.update(session_options) + + @asynccontextmanager + async def connect(self) -> AsyncGenerator[None, None]: + """Connect to the Gemini Realtime API.""" + try: + async with connect( + self._base_url, additional_headers={"Content-Type": "application/json"} + ) as self._connection: + yield + finally: + self._connection = None + + async def read_events(self) -> AsyncGenerator[RealtimeEvent, None]: + """Read Events from the Gemini Realtime Client""" + if self._connection is None: + raise RuntimeError("Client is not connected, call connect() first.") + await self._initialize_session() + + self._is_reading_events = True + + async for event in self._read_events(): + yield event + + async def _read_from_connection(self) -> AsyncGenerator[RealtimeEvent, None]: + """Read messages from the Gemini Realtime connection.""" + async for raw_message in self.connection: + message = raw_message.decode("ascii") if isinstance(raw_message, bytes) else raw_message + events = self._parse_message(json.loads(message)) + for event in events: + yield event + + def _parse_message(self, response: dict[str, Any]) -> list[RealtimeEvent]: + """Parse a message from the Gemini Realtime API. + + Args: + response (dict[str, Any]): The response to parse. + + Returns: + list[RealtimeEvent]: The parsed events. 
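+
+        Note:
+            `serverContent.modelTurn` audio parts are mapped to `AudioDelta`, `toolCall` entries to
+            `FunctionCall`, and `setupComplete` to `SessionCreated`; any other payload is wrapped in a
+            plain `RealtimeEvent`.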
+ """ + if "serverContent" in response and "modelTurn" in response["serverContent"]: + try: + b64data = response["serverContent"]["modelTurn"]["parts"][0]["inlineData"].pop("data") + return [ + AudioDelta( + delta=b64data, + item_id=None, + raw_message=response, + ) + ] + except KeyError: + return [] + elif "toolCall" in response: + return [ + FunctionCall( + raw_message=response, + call_id=call["id"], + name=call["name"], + arguments=call["args"], + ) + for call in response["toolCall"]["functionCalls"] + ] + elif "setupComplete" in response: + return [ + SessionCreated(raw_message=response), + ] + else: + return [RealtimeEvent(raw_message=response)] + + @classmethod + def get_factory( + cls, llm_config: Union[LLMConfig, dict[str, Any]], logger: Logger, **kwargs: Any + ) -> Optional[Callable[[], "RealtimeClientProtocol"]]: + """Create a Realtime API client. + + Args: + llm_config: The LLM config for the client. + logger: The logger for the client. + **kwargs: Additional arguments. + + Returns: + RealtimeClientProtocol: The Realtime API client is returned if the model matches the pattern + """ + if llm_config["config_list"][0].get("api_type") == "google" and list(kwargs.keys()) == []: + return lambda: GeminiRealtimeClient(llm_config=llm_config, logger=logger, **kwargs) + return None + + +# needed for mypy to check if GeminiRealtimeClient implements RealtimeClientProtocol +if TYPE_CHECKING: + _client: RealtimeClientProtocol = GeminiRealtimeClient(llm_config={}) diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/__init__.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/__init__.py new file mode 100644 index 0000000..52d380a --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/__init__.py @@ -0,0 +1,8 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from .base_client import OpenAIRealtimeClient +from .rtc_client import OpenAIRealtimeWebRTCClient + +__all__ = ["OpenAIRealtimeClient", "OpenAIRealtimeWebRTCClient"] diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/base_client.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/base_client.py new file mode 100644 index 0000000..1c4953c --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/base_client.py @@ -0,0 +1,220 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from collections.abc import AsyncGenerator +from contextlib import asynccontextmanager +from logging import Logger, getLogger +from typing import TYPE_CHECKING, Any, Callable, Optional, Union + +from ......doc_utils import export_module +from ......import_utils import optional_import_block, require_optional_import +from ......llm_config import LLMConfig +from ...realtime_events import RealtimeEvent +from ..realtime_client import RealtimeClientBase, Role, register_realtime_client +from .utils import parse_oai_message + +with optional_import_block(): + from openai import DEFAULT_MAX_RETRIES, NOT_GIVEN, AsyncOpenAI + from openai.resources.beta.realtime.realtime import AsyncRealtimeConnection + + +if TYPE_CHECKING: + from ..realtime_client import RealtimeClientProtocol + +__all__ = ["OpenAIRealtimeClient"] + +global_logger = getLogger(__name__) + + +@register_realtime_client() 
+@require_optional_import("openai>=1.66.2", "openai-realtime", except_for=["get_factory", "__init__"]) +@export_module("autogen.agentchat.realtime.experimental.clients") +class OpenAIRealtimeClient(RealtimeClientBase): + """(Experimental) Client for OpenAI Realtime API.""" + + def __init__( + self, + *, + llm_config: Union[LLMConfig, dict[str, Any]], + logger: Optional[Logger] = None, + ) -> None: + """(Experimental) Client for OpenAI Realtime API. + + Args: + llm_config: The config for the client. + logger: the logger to use for logging events + """ + super().__init__() + self._llm_config = llm_config + self._logger = logger + + self._connection: Optional["AsyncRealtimeConnection"] = None + + self.config = llm_config["config_list"][0] + # model is passed to self._client.beta.realtime.connect function later + self._model: str = self.config["model"] + self._voice: str = self.config.get("voice", "alloy") + self._temperature: float = llm_config.get("temperature", 0.8) # type: ignore[union-attr] + + self._client: Optional["AsyncOpenAI"] = None + + @property + def logger(self) -> Logger: + """Get the logger for the OpenAI Realtime API.""" + return self._logger or global_logger + + @property + def connection(self) -> "AsyncRealtimeConnection": + """Get the OpenAI WebSocket connection.""" + if self._connection is None: + raise RuntimeError("OpenAI WebSocket is not initialized") + return self._connection + + async def send_function_result(self, call_id: str, result: str) -> None: + """Send the result of a function call to the OpenAI Realtime API. + + Args: + call_id (str): The ID of the function call. + result (str): The result of the function call. + """ + await self.connection.conversation.item.create( + item={ + "type": "function_call_output", + "call_id": call_id, + "output": result, + }, + ) + + await self.connection.response.create() + + async def send_text(self, *, role: Role, text: str) -> None: + """Send a text message to the OpenAI Realtime API. + + Args: + role (str): The role of the message. + text (str): The text of the message. + """ + await self.connection.response.cancel() + await self.connection.conversation.item.create( + item={"type": "message", "role": role, "content": [{"type": "input_text", "text": text}]} + ) + await self.connection.response.create() + + async def send_audio(self, audio: str) -> None: + """Send audio to the OpenAI Realtime API. + + Args: + audio (str): The audio to send. + """ + await self.queue_input_audio_buffer_delta(audio) + await self.connection.input_audio_buffer.append(audio=audio) + + async def truncate_audio(self, audio_end_ms: int, content_index: int, item_id: str) -> None: + """Truncate audio in the OpenAI Realtime API. + + Args: + audio_end_ms (int): The end of the audio to truncate. + content_index (int): The index of the content to truncate. + item_id (str): The ID of the item to truncate. + """ + await self.connection.conversation.item.truncate( + audio_end_ms=audio_end_ms, content_index=content_index, item_id=item_id + ) + + async def _initialize_session(self) -> None: + """Control initial session with OpenAI.""" + session_update = { + "turn_detection": {"type": "server_vad"}, + "voice": self._voice, + "modalities": ["audio", "text"], + "temperature": self._temperature, + } + await self.session_update(session_options=session_update) + + async def session_update(self, session_options: dict[str, Any]) -> None: + """Send a session update to the OpenAI Realtime API. + + Args: + session_options (dict[str, Any]): The session options to update. 
+ """ + logger = self.logger + logger.info(f"Sending session update: {session_options}") + await self.connection.session.update(session=session_options) # type: ignore[arg-type] + logger.info("Sending session update finished") + + @asynccontextmanager + async def connect(self) -> AsyncGenerator[None, None]: + """Connect to the OpenAI Realtime API.""" + try: + if not self._client: + self._client = AsyncOpenAI( + api_key=self.config.get("api_key", None), + organization=self.config.get("organization", None), + project=self.config.get("project", None), + base_url=self.config.get("base_url", None), + websocket_base_url=self.config.get("websocket_base_url", None), + timeout=self.config.get("timeout", NOT_GIVEN), + max_retries=self.config.get("max_retries", DEFAULT_MAX_RETRIES), + default_headers=self.config.get("default_headers", None), + default_query=self.config.get("default_query", None), + ) + async with self._client.beta.realtime.connect( + model=self._model, + ) as self._connection: + await self._initialize_session() + yield + finally: + self._connection = None + + async def read_events(self) -> AsyncGenerator[RealtimeEvent, None]: + """Read messages from the OpenAI Realtime API.""" + if self._connection is None: + raise RuntimeError("Client is not connected, call connect() first.") + + try: + async for event in self._read_events(): + yield event + + finally: + self._connection = None + + async def _read_from_connection(self) -> AsyncGenerator[RealtimeEvent, None]: + """Read messages from the OpenAI Realtime API.""" + async for message in self._connection: + for event in self._parse_message(message.model_dump()): + yield event + + def _parse_message(self, message: dict[str, Any]) -> list[RealtimeEvent]: + """Parse a message from the OpenAI Realtime API. + + Args: + message (dict[str, Any]): The message to parse. + + Returns: + RealtimeEvent: The parsed event. + """ + return [parse_oai_message(message)] + + @classmethod + def get_factory( + cls, llm_config: Union[LLMConfig, dict[str, Any]], logger: Logger, **kwargs: Any + ) -> Optional[Callable[[], "RealtimeClientProtocol"]]: + """Create a Realtime API client. + + Args: + llm_config: The config for the client. + logger: The logger to use for logging events. + kwargs: Additional arguments. 
+ + Returns: + RealtimeClientProtocol: The Realtime API client is returned if the model matches the pattern + """ + if llm_config["config_list"][0].get("api_type", "openai") == "openai" and list(kwargs.keys()) == []: + return lambda: OpenAIRealtimeClient(llm_config=llm_config, logger=logger, **kwargs) + return None + + +# needed for mypy to check if OpenAIRealtimeWebRTCClient implements RealtimeClientProtocol +if TYPE_CHECKING: + _client: RealtimeClientProtocol = OpenAIRealtimeClient(llm_config={}) diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/rtc_client.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/rtc_client.py new file mode 100644 index 0000000..3ba079c --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/rtc_client.py @@ -0,0 +1,243 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +import json +from collections.abc import AsyncGenerator +from contextlib import asynccontextmanager +from logging import Logger, getLogger +from typing import TYPE_CHECKING, Any, Callable, Optional, Union + +from autogen.import_utils import optional_import_block, require_optional_import + +from ......doc_utils import export_module +from ......llm_config import LLMConfig +from ...realtime_events import RealtimeEvent +from ..realtime_client import RealtimeClientBase, Role, register_realtime_client +from .utils import parse_oai_message + +if TYPE_CHECKING: + from ...websockets import WebSocketProtocol as WebSocket + from ..realtime_client import RealtimeClientProtocol + +with optional_import_block(): + import httpx + +__all__ = ["OpenAIRealtimeWebRTCClient"] + +global_logger = getLogger(__name__) + + +@register_realtime_client() +@require_optional_import("httpx", "openai-realtime", except_for="get_factory") +@export_module("autogen.agentchat.realtime.experimental.clients.oai") +class OpenAIRealtimeWebRTCClient(RealtimeClientBase): + """(Experimental) Client for OpenAI Realtime API that uses WebRTC protocol.""" + + def __init__( + self, + *, + llm_config: Union[LLMConfig, dict[str, Any]], + websocket: "WebSocket", + logger: Optional[Logger] = None, + ) -> None: + """(Experimental) Client for OpenAI Realtime API. + + Args: + llm_config: The config for the client. + websocket: the websocket to use for the connection + logger: the logger to use for logging events + """ + super().__init__() + self._llm_config = llm_config + self._logger = logger + self._websocket = websocket + + config = llm_config["config_list"][0] + self._model: str = config["model"] + self._voice: str = config.get("voice", "alloy") + self._temperature: float = llm_config.get("temperature", 0.8) # type: ignore[union-attr] + self._config = config + self._base_url = config.get("base_url", "https://api.openai.com/v1/realtime/sessions") + + @property + def logger(self) -> Logger: + """Get the logger for the OpenAI Realtime API.""" + return self._logger or global_logger + + async def send_function_result(self, call_id: str, result: str) -> None: + """Send the result of a function call to the OpenAI Realtime API. + + Args: + call_id (str): The ID of the function call. + result (str): The result of the function call. 
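+
+        Note:
+            In the WebRTC setup this process holds no direct connection to OpenAI; the
+            `conversation.item.create` and `response.create` events are sent over the AG2 websocket and
+            relayed to OpenAI by the JavaScript client that holds the actual connection.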
+ """ + await self._websocket.send_json({ + "type": "conversation.item.create", + "item": { + "type": "function_call_output", + "call_id": call_id, + "output": result, + }, + }) + await self._websocket.send_json({"type": "response.create"}) + + async def send_text(self, *, role: Role, text: str) -> None: + """Send a text message to the OpenAI Realtime API. + + Args: + role (str): The role of the message. + text (str): The text of the message. + """ + # await self.connection.response.cancel() #why is this here? + await self._websocket.send_json({ + "type": "response.cancel", + }) + await self._websocket.send_json({ + "type": "conversation.item.create", + "item": {"type": "message", "role": role, "content": [{"type": "input_text", "text": text}]}, + }) + # await self.connection.response.create() + await self._websocket.send_json({"type": "response.create"}) + + async def send_audio(self, audio: str) -> None: + """Send audio to the OpenAI Realtime API. + in case of WebRTC, audio is already sent by js client, so we just queue it in order to be logged. + + Args: + audio (str): The audio to send. + """ + await self.queue_input_audio_buffer_delta(audio) + + async def truncate_audio(self, audio_end_ms: int, content_index: int, item_id: str) -> None: + """Truncate audio in the OpenAI Realtime API. + + Args: + audio_end_ms (int): The end of the audio to truncate. + content_index (int): The index of the content to truncate. + item_id (str): The ID of the item to truncate. + """ + await self._websocket.send_json({ + "type": "conversation.item.truncate", + "content_index": content_index, + "item_id": item_id, + "audio_end_ms": audio_end_ms, + }) + + async def session_update(self, session_options: dict[str, Any]) -> None: + """Send a session update to the OpenAI Realtime API. + + In the case of WebRTC we can not send it directly, but we can send it + to the javascript over the websocket, and rely on it to send session + update to OpenAI + + Args: + session_options (dict[str, Any]): The session options to update. + """ + logger = self.logger + logger.info(f"Sending session update: {session_options}") + # await self.connection.session.update(session=session_options) # type: ignore[arg-type] + await self._websocket.send_json({"type": "session.update", "session": session_options}) + logger.info("Sending session update finished") + + def session_init_data(self) -> list[dict[str, Any]]: + """Control initial session with OpenAI.""" + session_update = { + "turn_detection": {"type": "server_vad"}, + "voice": self._voice, + "modalities": ["audio", "text"], + "temperature": self._temperature, + } + return [{"type": "session.update", "session": session_update}] + + async def _initialize_session(self) -> None: ... + + @asynccontextmanager + async def connect(self) -> AsyncGenerator[None, None]: + """Connect to the OpenAI Realtime API. 
+ + In the case of WebRTC, we pass connection information over the + websocket, so that javascript on the other end of websocket open + actual connection to OpenAI + """ + try: + base_url = self._base_url + api_key = self._config.get("api_key", None) + headers = { + "Authorization": f"Bearer {api_key}", # Use os.getenv to get from environment + "Content-Type": "application/json", + } + data = { + # "model": "gpt-4o-realtime-preview-2024-12-17", + "model": self._model, + "voice": self._voice, + } + async with httpx.AsyncClient() as client: + response = await client.post(base_url, headers=headers, json=data) + response.raise_for_status() + json_data = response.json() + json_data["model"] = self._model + if self._websocket is not None: + session_init = self.session_init_data() + await self._websocket.send_json({"type": "ag2.init", "config": json_data, "init": session_init}) + yield + finally: + pass + + async def read_events(self) -> AsyncGenerator[RealtimeEvent, None]: + """Read events from the OpenAI Realtime API.""" + async for event in self._read_events(): + yield event + + async def _read_from_connection(self) -> AsyncGenerator[RealtimeEvent, None]: + """Read messages from the OpenAI Realtime API connection. + Again, in case of WebRTC, we do not read OpenAI messages directly since we + do not hold connection to OpenAI. Instead we read messages from the websocket, and javascript + client on the other side of the websocket that is connected to OpenAI is relaying events to us. + """ + while True: + try: + message_json = await self._websocket.receive_text() + message = json.loads(message_json) + for event in self._parse_message(message): + yield event + except Exception as e: + self.logger.exception(f"Error reading from connection {e}") + break + + def _parse_message(self, message: dict[str, Any]) -> list[RealtimeEvent]: + """Parse a message from the OpenAI Realtime API. + + Args: + message (dict[str, Any]): The message to parse. + + Returns: + RealtimeEvent: The parsed event. + """ + return [parse_oai_message(message)] + + @classmethod + def get_factory( + cls, llm_config: Union[LLMConfig, dict[str, Any]], logger: Logger, **kwargs: Any + ) -> Optional[Callable[[], "RealtimeClientProtocol"]]: + """Create a Realtime API client. + + Args: + llm_config: The config for the client. + logger: The logger to use for logging events. + **kwargs: Additional arguments. 
+ + Returns: + RealtimeClientProtocol: The Realtime API client is returned if the model matches the pattern + """ + if llm_config["config_list"][0].get("api_type", "openai") == "openai" and list(kwargs.keys()) == ["websocket"]: + return lambda: OpenAIRealtimeWebRTCClient(llm_config=llm_config, logger=logger, **kwargs) + + return None + + +# needed for mypy to check if OpenAIRealtimeWebRTCClient implements RealtimeClientProtocol +if TYPE_CHECKING: + + def _rtc_client(websocket: "WebSocket") -> RealtimeClientProtocol: + return OpenAIRealtimeWebRTCClient(llm_config={}, websocket=websocket) diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/utils.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/utils.py new file mode 100644 index 0000000..28c00ea --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/oai/utils.py @@ -0,0 +1,48 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +import json +from typing import Any + +from ...realtime_events import ( + AudioDelta, + FunctionCall, + InputAudioBufferDelta, + RealtimeEvent, + SessionCreated, + SessionUpdated, + SpeechStarted, +) + +__all__ = ["parse_oai_message"] + + +def parse_oai_message(message: dict[str, Any]) -> RealtimeEvent: + """Parse a message from the OpenAI Realtime API. + + Args: + message (dict[str, Any]): The message to parse. + + Returns: + RealtimeEvent: The parsed event. + """ + if message.get("type") == "session.created": + return SessionCreated(raw_message=message) + elif message.get("type") == "session.updated": + return SessionUpdated(raw_message=message) + elif message.get("type") == "response.audio.delta": + return AudioDelta(raw_message=message, delta=message["delta"], item_id=message["item_id"]) + elif message.get("type") == "input_audio_buffer.speech_started": + return SpeechStarted(raw_message=message) + elif message.get("type") == "input_audio_buffer.delta": + return InputAudioBufferDelta(delta=message["delta"], item_id=None, raw_message=message) + elif message.get("type") == "response.function_call_arguments.done": + return FunctionCall( + raw_message=message, + call_id=message["call_id"], + name=message["name"], + arguments=json.loads(message["arguments"]), + ) + else: + return RealtimeEvent(raw_message=message) diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/realtime_client.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/realtime_client.py new file mode 100644 index 0000000..edc6f7a --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/clients/realtime_client.py @@ -0,0 +1,190 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +import asyncio +from collections.abc import AsyncGenerator +from logging import Logger +from typing import Any, AsyncContextManager, Callable, Literal, Optional, Protocol, TypeVar, Union, runtime_checkable + +from asyncer import create_task_group + +from .....doc_utils import export_module +from .....llm_config import LLMConfig +from ..realtime_events import InputAudioBufferDelta, RealtimeEvent + +__all__ = ["RealtimeClientProtocol", "Role", "get_client", "register_realtime_client"] + +# define role literal type for typing +Role = Literal["user", "assistant", "system"] + + +@runtime_checkable 
+@export_module("autogen.agentchat.realtime.experimental.clients") +class RealtimeClientProtocol(Protocol): + async def send_function_result(self, call_id: str, result: str) -> None: + """Send the result of a function call to a Realtime API. + + Args: + call_id (str): The ID of the function call. + result (str): The result of the function call. + """ + ... + + async def send_text(self, *, role: Role, text: str) -> None: + """Send a text message to a Realtime API. + + Args: + role (str): The role of the message. + text (str): The text of the message. + """ + ... + + async def send_audio(self, audio: str) -> None: + """Send audio to a Realtime API. + + Args: + audio (str): The audio to send. + """ + ... + + async def truncate_audio(self, audio_end_ms: int, content_index: int, item_id: str) -> None: + """Truncate audio in a Realtime API. + + Args: + audio_end_ms (int): The end of the audio to truncate. + content_index (int): The index of the content to truncate. + item_id (str): The ID of the item to truncate. + """ + ... + + async def session_update(self, session_options: dict[str, Any]) -> None: + """Send a session update to a Realtime API. + + Args: + session_options (dict[str, Any]): The session options to update. + """ + ... + + def connect(self) -> AsyncContextManager[None]: ... + + def read_events(self) -> AsyncGenerator[RealtimeEvent, None]: + """Read events from a Realtime Client.""" + ... + + async def _read_from_connection(self) -> AsyncGenerator[RealtimeEvent, None]: + """Read events from a Realtime connection.""" + ... + + def _parse_message(self, message: dict[str, Any]) -> list[RealtimeEvent]: + """Parse a message from a Realtime API. + + Args: + message (dict[str, Any]): The message to parse. + + Returns: + list[RealtimeEvent]: The parsed events. + """ + ... + + @classmethod + def get_factory( + cls, llm_config: Union[LLMConfig, dict[str, Any]], logger: Logger, **kwargs: Any + ) -> Optional[Callable[[], "RealtimeClientProtocol"]]: + """Create a Realtime API client. + + Args: + llm_config: The config for the client. + logger: The logger to use for logging events. + **kwargs: Additional arguments. + + Returns: + RealtimeClientProtocol: The Realtime API client is returned if the model matches the pattern + """ + ... + + +class RealtimeClientBase: + def __init__(self): + self._eventQueue = asyncio.Queue() + + async def add_event(self, event: Optional[RealtimeEvent]): + await self._eventQueue.put(event) + + async def get_event(self) -> Optional[RealtimeEvent]: + return await self._eventQueue.get() + + async def _read_from_connection_task(self): + async for event in self._read_from_connection(): + await self.add_event(event) + await self.add_event(None) + + async def _read_events(self) -> AsyncGenerator[RealtimeEvent, None]: + """Read events from a Realtime Client.""" + async with create_task_group() as tg: + tg.start_soon(self._read_from_connection_task) + while True: + try: + event = await self._eventQueue.get() + if event is not None: + yield event + else: + break + except Exception: + break + + async def queue_input_audio_buffer_delta(self, audio: str) -> None: + """queue InputAudioBufferDelta. + + Args: + audio (str): The audio. + """ + await self.add_event(InputAudioBufferDelta(delta=audio, item_id=None, raw_message=dict())) + + +_realtime_client_classes: dict[str, type[RealtimeClientProtocol]] = {} + +T = TypeVar("T", bound=RealtimeClientProtocol) + + +def register_realtime_client() -> Callable[[type[T]], type[T]]: + """Register a Realtime API client. 
+ + Returns: + Callable[[type[T]], type[T]]: The decorator to register the Realtime API client + """ + + def decorator(client_cls: type[T]) -> type[T]: + """Register a Realtime API client. + + Args: + client_cls: The client to register. + """ + global _realtime_client_classes + fqn = f"{client_cls.__module__}.{client_cls.__name__}" + _realtime_client_classes[fqn] = client_cls + + return client_cls + + return decorator + + +@export_module("autogen.agentchat.realtime.experimental.clients") +def get_client(llm_config: Union[LLMConfig, dict[str, Any]], logger: Logger, **kwargs: Any) -> "RealtimeClientProtocol": + """Get a registered Realtime API client. + + Args: + llm_config: The config for the client. + logger: The logger to use for logging events. + **kwargs: Additional arguments. + + Returns: + RealtimeClientProtocol: The Realtime API client. + """ + global _realtime_client_classes + for _, client_cls in _realtime_client_classes.items(): + factory = client_cls.get_factory(llm_config=llm_config, logger=logger, **kwargs) + if factory: + return factory() + + raise ValueError("Realtime API client not found.") diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/function_observer.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/function_observer.py new file mode 100644 index 0000000..98df085 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/function_observer.py @@ -0,0 +1,85 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +import asyncio +import json +from typing import TYPE_CHECKING, Any, Optional + +from asyncer import asyncify +from pydantic import BaseModel + +from ....doc_utils import export_module +from .realtime_events import FunctionCall, RealtimeEvent +from .realtime_observer import RealtimeObserver + +if TYPE_CHECKING: + from logging import Logger + + +@export_module("autogen.agentchat.realtime.experimental") +class FunctionObserver(RealtimeObserver): + """Observer for handling function calls from the OpenAI Realtime API.""" + + def __init__(self, *, logger: Optional["Logger"] = None) -> None: + """Observer for handling function calls from the OpenAI Realtime API.""" + super().__init__(logger=logger) + + async def on_event(self, event: RealtimeEvent) -> None: + """Handle function call events from the OpenAI Realtime API. + + Args: + event (dict[str, Any]): The event from the OpenAI Realtime API. + """ + if isinstance(event, FunctionCall): + self.logger.info("Received function call event") + await self.call_function( + call_id=event.call_id, + name=event.name, + kwargs=event.arguments, + ) + + async def call_function(self, call_id: str, name: str, kwargs: dict[str, Any]) -> None: + """Call a function registered with the agent. + + Args: + call_id (str): The ID of the function call. + name (str): The name of the function to call. + kwargs (Any[str, Any]): The arguments to pass to the function. 
+ """ + if name in self.agent.registered_realtime_tools: + func = self.agent.registered_realtime_tools[name].func + func = func if asyncio.iscoroutinefunction(func) else asyncify(func) + try: + result = await func(**kwargs) + except Exception: + result = "Function call failed" + self.logger.info(f"Function call failed: {name=}, {kwargs=}", stack_info=True) + + if isinstance(result, BaseModel): + result = result.model_dump_json() + elif not isinstance(result, str): + try: + result = json.dumps(result) + except Exception: + result = str(result) + + await self.realtime_client.send_function_result(call_id, result) + else: + self.logger.warning(f"Function {name} called, but is not registered with the realtime agent.") + + async def initialize_session(self) -> None: + """Add registered tools to OpenAI with a session update.""" + session_update = { + "tools": [tool.realtime_tool_schema for tool in self.agent.registered_realtime_tools.values()], + "tool_choice": "auto", + } + await self.realtime_client.session_update(session_update) + + async def run_loop(self) -> None: + """Run the observer loop.""" + pass + + +if TYPE_CHECKING: + function_observer: RealtimeObserver = FunctionObserver() diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_agent.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_agent.py new file mode 100644 index 0000000..703820c --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_agent.py @@ -0,0 +1,158 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from dataclasses import dataclass +from logging import Logger, getLogger +from typing import Any, Callable, Optional, TypeVar, Union + +from anyio import lowlevel +from asyncer import create_task_group + +from ....doc_utils import export_module +from ....llm_config import LLMConfig +from ....tools import Tool +from .clients.realtime_client import RealtimeClientProtocol, get_client +from .function_observer import FunctionObserver +from .realtime_observer import RealtimeObserver + +F = TypeVar("F", bound=Callable[..., Any]) + +global_logger = getLogger(__name__) + + +@dataclass +class RealtimeAgentCallbacks: + """Callbacks for the Realtime Agent.""" + + # async empty placeholder function + on_observers_ready: Callable[[], Any] = lambda: lowlevel.checkpoint() + + +@export_module("autogen.agentchat.realtime.experimental") +class RealtimeAgent: + def __init__( + self, + *, + name: str, + audio_adapter: Optional[RealtimeObserver] = None, + system_message: str = "You are a helpful AI Assistant.", + llm_config: Optional[Union[LLMConfig, dict[str, Any]]] = None, + logger: Optional[Logger] = None, + observers: Optional[list[RealtimeObserver]] = None, + **client_kwargs: Any, + ): + """(Experimental) Agent for interacting with the Realtime Clients. + + Args: + name (str): The name of the agent. + audio_adapter (Optional[RealtimeObserver] = None): The audio adapter for the agent. + system_message (str): The system message for the agent. + llm_config (LLMConfig, dict[str, Any], bool): The config for the agent. + logger (Optional[Logger]): The logger for the agent. + observers (Optional[list[RealtimeObserver]]): The additional observers for the agent. + **client_kwargs (Any): The keyword arguments for the client. 
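+
+        Example:
+            A minimal sketch (assumes `llm_config` contains a realtime-capable model entry and
+            `websocket` is an accepted connection, e.g. from FastAPI):
+
+            ```python
+            agent = RealtimeAgent(
+                name="assistant",
+                system_message="You are a helpful voice assistant.",
+                llm_config=llm_config,
+                audio_adapter=WebSocketAudioAdapter(websocket),
+            )
+            await agent.run()
+            ```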
+ """ + self._logger = logger + self._name = name + self._system_message = system_message + + llm_config = LLMConfig.get_current_llm_config(llm_config) + + self._realtime_client: RealtimeClientProtocol = get_client( + llm_config=llm_config, logger=self.logger, **client_kwargs + ) + + self._registered_realtime_tools: dict[str, Tool] = {} + self._observers: list[RealtimeObserver] = observers if observers else [] + self._observers.append(FunctionObserver(logger=logger)) + if audio_adapter: + self._observers.append(audio_adapter) + + self.callbacks = RealtimeAgentCallbacks() + + @property + def system_message(self) -> str: + """Get the system message for the agent.""" + return self._system_message + + @property + def logger(self) -> Logger: + """Get the logger for the agent.""" + return self._logger or global_logger + + @property + def realtime_client(self) -> RealtimeClientProtocol: + """Get the OpenAI Realtime Client.""" + return self._realtime_client + + @property + def registered_realtime_tools(self) -> dict[str, Tool]: + """Get the registered realtime tools.""" + return self._registered_realtime_tools + + def register_observer(self, observer: RealtimeObserver) -> None: + """Register an observer with the Realtime Agent. + + Args: + observer (RealtimeObserver): The observer to register. + """ + self._observers.append(observer) + + async def start_observers(self) -> None: + for observer in self._observers: + self._tg.soonify(observer.run)(self) + + # wait for the observers to be ready + for observer in self._observers: + await observer.wait_for_ready() + + await self.callbacks.on_observers_ready() + + async def run(self) -> None: + """Run the agent.""" + # everything is run in the same task group to enable easy cancellation using self._tg.cancel_scope.cancel() + async with create_task_group() as self._tg: # noqa: SIM117 + # connect with the client first (establishes a connection and initializes a session) + async with self._realtime_client.connect(): + # start the observers and wait for them to be ready + await self.realtime_client.session_update(session_options={"instructions": self.system_message}) + await self.start_observers() + + # iterate over the events + async for event in self.realtime_client.read_events(): + for observer in self._observers: + await observer.on_event(event) + + def register_realtime_function( + self, + *, + name: Optional[str] = None, + description: Optional[str] = None, + ) -> Callable[[Union[F, Tool]], Tool]: + """Decorator for registering a function to be used by an agent. + + Args: + name (str): The name of the function. + description (str): The description of the function. + + Returns: + Callable[[Union[F, Tool]], Tool]: The decorator for registering a function. + """ + + def _decorator(func_or_tool: Union[F, Tool]) -> Tool: + """Decorator for registering a function to be used by an agent. + + Args: + func_or_tool (Union[F, Tool]): The function or tool to register. + + Returns: + Tool: The registered tool. 
+ """ + tool = Tool(func_or_tool=func_or_tool, name=name, description=description) + + self._registered_realtime_tools[tool.name] = tool + + return tool + + return _decorator diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_events.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_events.py new file mode 100644 index 0000000..a94f8b3 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_events.py @@ -0,0 +1,42 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from typing import Any, Literal + +from pydantic import BaseModel + + +class RealtimeEvent(BaseModel): + raw_message: dict[str, Any] + + +class SessionCreated(RealtimeEvent): + type: Literal["session.created"] = "session.created" + + +class SessionUpdated(RealtimeEvent): + type: Literal["session.updated"] = "session.updated" + + +class AudioDelta(RealtimeEvent): + type: Literal["response.audio.delta"] = "response.audio.delta" + delta: str + item_id: Any + + +class InputAudioBufferDelta(RealtimeEvent): + type: Literal["input_audio_buffer.delta"] = "input_audio_buffer.delta" + delta: str + item_id: Any + + +class SpeechStarted(RealtimeEvent): + type: Literal["input_audio_buffer.speech_started"] = "input_audio_buffer.speech_started" + + +class FunctionCall(RealtimeEvent): + type: Literal["response.function_call_arguments.done"] = "response.function_call_arguments.done" + name: str + arguments: dict[str, Any] + call_id: str diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_observer.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_observer.py new file mode 100644 index 0000000..ca6890b --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_observer.py @@ -0,0 +1,100 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from abc import ABC, abstractmethod +from logging import Logger, getLogger +from typing import TYPE_CHECKING, Optional + +from anyio import Event + +from ....doc_utils import export_module +from .clients.realtime_client import RealtimeClientProtocol +from .realtime_events import RealtimeEvent + +if TYPE_CHECKING: + from .realtime_agent import RealtimeAgent + +__all__ = ["RealtimeObserver"] + +global_logger = getLogger(__name__) + + +@export_module("autogen.agentchat.realtime.experimental") +class RealtimeObserver(ABC): + """Observer for the OpenAI Realtime API.""" + + def __init__(self, *, logger: Optional[Logger] = None) -> None: + """Observer for the OpenAI Realtime API. + + Args: + logger (Logger): The logger for the observer. + """ + self._ready_event = Event() + self._agent: Optional[RealtimeAgent] = None + self._logger = logger + + @property + def logger(self) -> Logger: + return self._logger or global_logger + + @property + def agent(self) -> "RealtimeAgent": + if self._agent is None: + raise RuntimeError("Agent has not been set.") + return self._agent + + @property + def realtime_client(self) -> RealtimeClientProtocol: + if self._agent is None: + raise RuntimeError("Agent has not been set.") + if self._agent.realtime_client is None: + raise RuntimeError("Realtime client has not been set.") + + return self._agent.realtime_client + + async def run(self, agent: "RealtimeAgent") -> None: + """Run the observer with the agent. 
+ + When implementing, be sure to call `self._ready_event.set()` when the observer is ready to process events. + + Args: + agent (RealtimeAgent): The realtime agent attached to the observer. + """ + self._agent = agent + await self.initialize_session() + self._ready_event.set() + + await self.run_loop() + + @abstractmethod + async def run_loop(self) -> None: + """Run the loop if needed. + + This method is called after the observer is ready to process events. + Events will be processed by the on_event method, this is just a hook for additional processing. + Use initialize_session to set up the session. + """ + ... + + @abstractmethod + async def initialize_session(self) -> None: + """Initialize the session for the observer.""" + ... + + async def wait_for_ready(self) -> None: + """Get the event that is set when the observer is ready.""" + await self._ready_event.wait() + + @abstractmethod + async def on_event(self, event: RealtimeEvent) -> None: + """Handle an event from the OpenAI Realtime API. + + Args: + event (RealtimeServerEvent): The event from the OpenAI Realtime API. + """ + ... + + async def on_close(self) -> None: + """Handle close of RealtimeClient.""" + ... diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_swarm.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_swarm.py new file mode 100644 index 0000000..ca7f2c3 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/realtime_swarm.py @@ -0,0 +1,483 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +import logging +import warnings +from collections import defaultdict +from typing import TYPE_CHECKING, Any, Callable, Optional, TypeVar, Union + +import anyio +from asyncer import asyncify, create_task_group, syncify + +from ....agentchat.contrib.swarm_agent import AfterWorkOption, initiate_swarm_chat +from ....cache import AbstractCache +from ....code_utils import content_str +from ....doc_utils import export_module +from ... import Agent, ChatResult, ConversableAgent, LLMAgent +from ...utils import consolidate_chat_info, gather_usage_summary + +if TYPE_CHECKING: + from .clients import Role + from .realtime_agent import RealtimeAgent + +__all__ = ["register_swarm"] + +SWARM_SYSTEM_MESSAGE = ( + "You are a helpful voice assistant. Your task is to listen to user and to coordinate the tasks based on his/her inputs." + "You can and will communicate using audio output only." +) + +QUESTION_ROLE: "Role" = "user" +QUESTION_MESSAGE = ( + "I have a question/information for myself. DO NOT ANSWER YOURSELF, GET THE ANSWER FROM ME. " + "repeat the question to me **WITH AUDIO OUTPUT** and AFTER YOU GET THE ANSWER FROM ME call 'answer_task_question' with the answer in first person\n\n" + "IMPORTANT: repeat just the question, without any additional information or context\n\n" + "The question is: '{}'\n\n" +) +QUESTION_TIMEOUT_SECONDS = 20 + +logger = logging.getLogger(__name__) + +F = TypeVar("F", bound=Callable[..., Any]) + + +def message_to_dict(message: Union[dict[str, Any], str]) -> dict[str, Any]: + if isinstance(message, str): + return {"content": message} + elif isinstance(message, dict): + return message + else: + return dict(message) + + +def parse_oai_message(message: Union[dict[str, Any], str], role: str, adressee: Agent) -> dict[str, Any]: + """ + Parse a message into an OpenAI-compatible message format. + + Args: + message: The message to parse. 
+ role: The role associated with the message. + adressee: The agent that will receive the message. + + Returns: + The parsed message in OpenAI-compatible format. + + Raises: + ValueError: If the message lacks required fields like 'content', 'function_call', or 'tool_calls'. + """ + message = message_to_dict(message) + + # Extract relevant fields while ensuring none are None + oai_message = { + key: message[key] + for key in ("content", "function_call", "tool_calls", "tool_responses", "tool_call_id", "name", "context") + if key in message and message[key] is not None + } + + # Validate or set the content field + if "content" not in oai_message: + if "function_call" in oai_message or "tool_calls" in oai_message: + oai_message["content"] = None + else: + raise ValueError("Message must have either 'content', 'function_call', or 'tool_calls' field.") + + # Determine and assign the role + if message.get("role") in ["function", "tool"]: + oai_message["role"] = message["role"] + # Ensure all tool responses have string content + for tool_response in oai_message.get("tool_responses", []): + tool_response["content"] = str(tool_response["content"]) + elif "override_role" in message: + oai_message["role"] = message["override_role"] + else: + oai_message["role"] = role + + # Enforce specific role requirements for assistant messages + if oai_message.get("function_call") or oai_message.get("tool_calls"): + oai_message["role"] = "assistant" + + # Add a name field if missing + if "name" not in oai_message: + oai_message["name"] = adressee.name + + return oai_message + + +class SwarmableAgent(Agent): + """A class for an agent that can participate in a swarm chat.""" + + def __init__( + self, + name: str, + system_message: str = "You are a helpful AI Assistant.", + is_termination_msg: Optional[Callable[..., bool]] = None, + description: Optional[str] = None, + silent: Optional[bool] = None, + ): + self._oai_messages: dict[Agent, Any] = defaultdict(list) + + self._system_message = system_message + self._description = description if description is not None else system_message + self._is_termination_msg = ( + is_termination_msg + if is_termination_msg is not None + else (lambda x: content_str(x.get("content")) == "TERMINATE") + ) + self.silent = silent + + self._name = name + + # Initialize standalone client cache object. + self.client_cache = None + self.previous_cache = None + + self.reply_at_receive: dict[Agent, bool] = defaultdict(bool) + + @property + def system_message(self) -> str: + return self._system_message + + def update_system_message(self, system_message: str) -> None: + """Update this agent's system message. + + Args: + system_message (str): system message for inference. 
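+
+        Example (illustrative only):
+            `agent.update_system_message("Reply with one short sentence.")`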
+ """ + self._system_message = system_message + + @property + def name(self) -> str: + return self._name + + @property + def description(self) -> str: + return self._description + + def send( + self, + message: Union[dict[str, Any], str], + recipient: Agent, + request_reply: Optional[bool] = None, + silent: Optional[bool] = False, + ) -> None: + self._oai_messages[recipient].append(parse_oai_message(message, "assistant", recipient)) + recipient.receive(message, self, request_reply) + + def receive( + self, + message: Union[dict[str, Any], str], + sender: Agent, + request_reply: Optional[bool] = None, + silent: Optional[bool] = False, + ) -> None: + self._oai_messages[sender].append(parse_oai_message(message, "user", self)) + if request_reply is False or (request_reply is None and self.reply_at_receive[sender] is False): + return + reply = self.generate_reply(messages=self.chat_messages[sender], sender=sender) + if reply is not None: + self.send(reply, sender, silent=silent) + + def generate_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional["Agent"] = None, + **kwargs: Any, + ) -> Union[str, dict[str, Any], None]: + if messages is None: + if sender is None: + raise ValueError("Either messages or sender must be provided.") + messages = self._oai_messages[sender] + + _, reply = self.check_termination_and_human_reply(messages=messages, sender=sender, config=None) + + return reply + + def check_termination_and_human_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[Any] = None, + ) -> tuple[bool, Union[str, None]]: + raise NotImplementedError + + def initiate_chat( + self, + recipient: ConversableAgent, + message: Union[dict[str, Any], str], + clear_history: bool = True, + silent: Optional[bool] = False, + cache: Optional[AbstractCache] = None, + summary_args: Optional[dict[str, Any]] = {}, + **kwargs: dict[str, Any], + ) -> ChatResult: + _chat_info = locals().copy() + _chat_info["sender"] = self + consolidate_chat_info(_chat_info, uniform_sender=self) + recipient._raise_exception_on_async_reply_functions() + recipient.previous_cache = recipient.client_cache # type: ignore[attr-defined] + recipient.client_cache = cache # type: ignore[attr-defined, assignment] + + self._prepare_chat(recipient, clear_history) + self.send(message, recipient, silent=silent) + summary = self._last_msg_as_summary(self, recipient, summary_args) + + recipient.client_cache = recipient.previous_cache # type: ignore[attr-defined] + recipient.previous_cache = None # type: ignore[attr-defined] + + chat_result = ChatResult( + chat_history=self.chat_messages[recipient], + summary=summary, + cost=gather_usage_summary([self, recipient]), # type: ignore[arg-type] + human_input=[], + ) + return chat_result + + async def a_generate_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional["Agent"] = None, + **kwargs: Any, + ) -> Union[str, dict[str, Any], None]: + return self.generate_reply(messages=messages, sender=sender, **kwargs) + + async def a_receive( + self, + message: Union[dict[str, Any], str], + sender: "Agent", + request_reply: Optional[bool] = None, + ) -> None: + self.receive(message, sender, request_reply) + + async def a_send( + self, + message: Union[dict[str, Any], str], + recipient: "Agent", + request_reply: Optional[bool] = None, + ) -> None: + self.send(message, recipient, request_reply) + + @property + def chat_messages(self) -> dict[Agent, list[dict[str, Any]]]: + """A dictionary 
of conversations from agent to list of messages.""" + return self._oai_messages + + def last_message(self, agent: Optional[Agent] = None) -> Optional[dict[str, Any]]: + if agent is None: + n_conversations = len(self._oai_messages) + if n_conversations == 0: + return None + if n_conversations == 1: + for conversation in self._oai_messages.values(): + return conversation[-1] # type: ignore[no-any-return] + raise ValueError("More than one conversation is found. Please specify the sender to get the last message.") + if agent not in self._oai_messages(): + raise KeyError( + f"The agent '{agent.name}' is not present in any conversation. No history available for this agent." + ) + return self._oai_messages[agent][-1] # type: ignore[no-any-return] + + def _prepare_chat( + self, + recipient: ConversableAgent, + clear_history: bool, + prepare_recipient: bool = True, + reply_at_receive: bool = True, + ) -> None: + self.reply_at_receive[recipient] = reply_at_receive + if clear_history: + self._oai_messages[recipient].clear() + if prepare_recipient: + recipient._prepare_chat(self, clear_history, False, reply_at_receive) # type: ignore[arg-type] + + def _raise_exception_on_async_reply_functions(self) -> None: + pass + + def set_ui_tools(self, tools: Optional[list] = None) -> None: + """Set UI tools for the agent.""" + pass + + def unset_ui_tools(self) -> None: + """Unset UI tools for the agent.""" + pass + + @staticmethod + def _last_msg_as_summary(sender: Agent, recipient: Agent, summary_args: Optional[dict[str, Any]]) -> str: + """Get a chat summary from the last message of the recipient.""" + summary = "" + try: + content = recipient.last_message(sender)["content"] # type: ignore[attr-defined] + if isinstance(content, str): + summary = content.replace("TERMINATE", "") + elif isinstance(content, list): + summary = "\n".join( + x["text"].replace("TERMINATE", "") for x in content if isinstance(x, dict) and "text" in x + ) + except (IndexError, AttributeError) as e: + warnings.warn(f"Cannot extract summary using last_msg: {e}. Using an empty str as summary.", UserWarning) + return summary + + +# check that the SwarmableAgent class is implementing LLMAgent protocol +if TYPE_CHECKING: + + def _create_swarmable_agent( + name: str, + system_message: str, + is_termination_msg: Optional[Callable[..., bool]], + description: Optional[str], + silent: Optional[bool], + ) -> LLMAgent: + return SwarmableAgent( + name=name, + system_message=system_message, + is_termination_msg=is_termination_msg, + description=description, + silent=silent, + ) + + +class SwarmableRealtimeAgent(SwarmableAgent): + def __init__( + self, + realtime_agent: "RealtimeAgent", + initial_agent: ConversableAgent, + agents: list[ConversableAgent], + question_message: Optional[str] = None, + ) -> None: + self._initial_agent = initial_agent + self._agents = agents + self._realtime_agent = realtime_agent + + self._answer_event: anyio.Event = anyio.Event() + self._answer: str = "" + self.question_message = question_message or QUESTION_MESSAGE + + super().__init__( + name=realtime_agent._name, + is_termination_msg=None, + description=None, + silent=None, + ) + + def reset_answer(self) -> None: + """Reset the answer event.""" + self._answer_event = anyio.Event() + + def set_answer(self, answer: str) -> str: + """Set the answer to the question.""" + self._answer = answer + self._answer_event.set() + return "Answer set successfully." 
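+
+    # Note on the question/answer handshake: `ask_question` resets the answer
+    # event, repeats the question to the user until it is answered, and
+    # `get_answer` blocks on the same event. `set_answer` (registered later in
+    # `configure_realtime_agent` as the "answer_task_question" realtime
+    # function) stores the reply and sets the event, unblocking both.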
+ + async def get_answer(self) -> str: + """Get the answer to the question.""" + await self._answer_event.wait() + return self._answer + + async def ask_question(self, question: str, question_timeout: int) -> None: + """Send a question for the user to the agent and wait for the answer. + If the answer is not received within the timeout, the question is repeated. + + Args: + question: The question to ask the user. + question_timeout: The time in seconds to wait for the answer. + """ + self.reset_answer() + realtime_client = self._realtime_agent._realtime_client + await realtime_client.send_text(role=QUESTION_ROLE, text=question) + + async def _check_event_set(timeout: int = question_timeout) -> bool: + for _ in range(timeout): + if self._answer_event.is_set(): + return True + await anyio.sleep(1) + return False + + while not await _check_event_set(): + await realtime_client.send_text(role=QUESTION_ROLE, text=question) + + def check_termination_and_human_reply( + self, + messages: Optional[list[dict[str, Any]]] = None, + sender: Optional[Agent] = None, + config: Optional[Any] = None, + ) -> tuple[bool, Optional[str]]: + """Check if the conversation should be terminated and if the agent should reply. + + Called when its agents turn in the chat conversation. + + Args: + messages (list[dict[str, Any]]): The messages in the conversation. + sender (Agent): The agent that sent the message. + config (Optional[Any]): The configuration for the agent. + """ + if not messages: + return False, None + + async def get_input() -> None: + async with create_task_group() as tg: + tg.soonify(self.ask_question)( + self.question_message.format(messages[-1]["content"]), + question_timeout=QUESTION_TIMEOUT_SECONDS, + ) + + syncify(get_input)() + + return True, {"role": "user", "content": self._answer} # type: ignore[return-value] + + def start_chat(self) -> None: + raise NotImplementedError + + def configure_realtime_agent(self, system_message: Optional[str]) -> None: + realtime_agent = self._realtime_agent + + logger = realtime_agent.logger + if not system_message: + if realtime_agent.system_message != "You are a helpful AI Assistant.": + logger.warning( + "Overriding system message set up in `__init__`, please use `system_message` parameter of the `register_swarm` function instead." + ) + system_message = SWARM_SYSTEM_MESSAGE + + realtime_agent._system_message = system_message + + realtime_agent.register_realtime_function( + name="answer_task_question", description="Answer question from the task" + )(self.set_answer) + + async def on_observers_ready() -> None: + self._realtime_agent._tg.soonify(asyncify(initiate_swarm_chat))( + initial_agent=self._initial_agent, + agents=self._agents, + user_agent=self, # type: ignore[arg-type] + messages="Find out what the user wants.", + after_work=AfterWorkOption.REVERT_TO_USER, + ) + + self._realtime_agent.callbacks.on_observers_ready = on_observers_ready + + +@export_module("autogen.agentchat.realtime.experimental") +def register_swarm( + *, + realtime_agent: "RealtimeAgent", + initial_agent: ConversableAgent, + agents: list[ConversableAgent], + system_message: Optional[str] = None, + question_message: Optional[str] = None, +) -> None: + """Create a SwarmableRealtimeAgent. + + Args: + realtime_agent (RealtimeAgent): The RealtimeAgent to create the SwarmableRealtimeAgent from. + initial_agent (ConversableAgent): The initial agent. + agents (list[ConversableAgent]): The agents in the swarm. + system_message (Optional[str]): The system message to set for the agent. 
If None, the default system message is used. + question_message (Optional[str]): The question message to set for the agent. If None, the default QUESTION_MESSAGE is used. + """ + swarmable_agent = SwarmableRealtimeAgent( + realtime_agent=realtime_agent, initial_agent=initial_agent, agents=agents, question_message=question_message + ) + + swarmable_agent.configure_realtime_agent(system_message=system_message) diff --git a/mm_agents/coact/autogen/agentchat/realtime/experimental/websockets.py b/mm_agents/coact/autogen/agentchat/realtime/experimental/websockets.py new file mode 100644 index 0000000..e5ab408 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime/experimental/websockets.py @@ -0,0 +1,21 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from collections.abc import AsyncIterator +from typing import Any, Protocol, runtime_checkable + +__all__ = ["WebSocketProtocol"] + + +@runtime_checkable +class WebSocketProtocol(Protocol): + """WebSocket protocol for sending and receiving JSON data modelled after FastAPI's WebSocket.""" + + async def send_json(self, data: Any, mode: str = "text") -> None: ... + + async def receive_json(self, mode: str = "text") -> Any: ... + + async def receive_text(self) -> str: ... + + def iter_text(self) -> AsyncIterator[str]: ... diff --git a/mm_agents/coact/autogen/agentchat/realtime_agent/__init__.py b/mm_agents/coact/autogen/agentchat/realtime_agent/__init__.py new file mode 100644 index 0000000..6e14b66 --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/realtime_agent/__init__.py @@ -0,0 +1,21 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 + +from ..realtime.experimental import ( + FunctionObserver, + RealtimeAgent, + RealtimeObserver, + TwilioAudioAdapter, + WebSocketAudioAdapter, + register_swarm, +) + +__all__ = [ + "FunctionObserver", + "RealtimeAgent", + "RealtimeObserver", + "TwilioAudioAdapter", + "WebSocketAudioAdapter", + "register_swarm", +] diff --git a/mm_agents/coact/autogen/agentchat/user_proxy_agent.py b/mm_agents/coact/autogen/agentchat/user_proxy_agent.py new file mode 100644 index 0000000..134a74b --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/user_proxy_agent.py @@ -0,0 +1,111 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +from typing import Any, Callable, Literal, Optional, Union + +from ..doc_utils import export_module +from ..llm_config import LLMConfig +from ..runtime_logging import log_new_agent, logging_enabled +from .conversable_agent import ConversableAgent + + +@export_module("autogen") +class UserProxyAgent(ConversableAgent): + """(In preview) A proxy agent for the user, that can execute code and provide feedback to the other agents. + + UserProxyAgent is a subclass of ConversableAgent configured with `human_input_mode` to ALWAYS + and `llm_config` to False. By default, the agent will prompt for human input every time a message is received. + Code execution is enabled by default. LLM-based auto reply is disabled by default. + To modify auto reply, register a method with [`register_reply`](../ConversableAgent#register-reply). 
+ To modify the way to get human input, override `get_human_input` method. + To modify the way to execute code blocks, single code block, or function call, override `execute_code_blocks`, + `run_code`, and `execute_function` methods respectively. + """ + + # Default UserProxyAgent.description values, based on human_input_mode + DEFAULT_USER_PROXY_AGENT_DESCRIPTIONS = { + "ALWAYS": "An attentive HUMAN user who can answer questions about the task, and can perform tasks such as running Python code or inputting command line commands at a Linux terminal and reporting back the execution results.", + "TERMINATE": "A user that can run Python code or input command line commands at a Linux terminal and report back the execution results.", + "NEVER": "A computer terminal that performs no other action than running Python scripts (provided to it quoted in ```python code blocks), or sh shell scripts (provided to it quoted in ```sh code blocks).", + } + + def __init__( + self, + name: str, + is_termination_msg: Optional[Callable[[dict[str, Any]], bool]] = None, + max_consecutive_auto_reply: Optional[int] = None, + human_input_mode: Literal["ALWAYS", "TERMINATE", "NEVER"] = "ALWAYS", + function_map: Optional[dict[str, Callable[..., Any]]] = None, + code_execution_config: Union[dict[str, Any], Literal[False]] = {}, + default_auto_reply: Optional[Union[str, dict[str, Any]]] = "", + llm_config: Optional[Union[LLMConfig, dict[str, Any], Literal[False]]] = False, + system_message: Optional[Union[str, list[str]]] = "", + description: Optional[str] = None, + **kwargs: Any, + ): + """Args: + name (str): name of the agent. + is_termination_msg (function): a function that takes a message in the form of a dictionary + and returns a boolean value indicating if this received message is a termination message. + The dict can contain the following keys: "content", "role", "name", "function_call". + max_consecutive_auto_reply (int): the maximum number of consecutive auto replies. + default to None (no limit provided, class attribute MAX_CONSECUTIVE_AUTO_REPLY will be used as the limit in this case). + The limit only plays a role when human_input_mode is not "ALWAYS". + human_input_mode (str): whether to ask for human inputs every time a message is received. + Possible values are "ALWAYS", "TERMINATE", "NEVER". + (1) When "ALWAYS", the agent prompts for human input every time a message is received. + Under this mode, the conversation stops when the human input is "exit", + or when is_termination_msg is True and there is no human input. + (2) When "TERMINATE", the agent only prompts for human input only when a termination message is received or + the number of auto reply reaches the max_consecutive_auto_reply. + (3) When "NEVER", the agent will never prompt for human input. Under this mode, the conversation stops + when the number of auto reply reaches the max_consecutive_auto_reply or when is_termination_msg is True. + function_map (dict[str, callable]): Mapping function names (passed to openai) to callable functions. + code_execution_config (dict or False): config for the code execution. + To disable code execution, set to False. Otherwise, set to a dictionary with the following keys: + - work_dir (Optional, str): The working directory for the code execution. + If None, a default working directory will be used. + The default working directory is the "extensions" directory under + "path_to_autogen". + - use_docker (Optional, list, str or bool): The docker image to use for code execution. 
+ Default is True, which means the code will be executed in a docker container. A default list of images will be used. + If a list or a str of image name(s) is provided, the code will be executed in a docker container + with the first image successfully pulled. + If False, the code will be executed in the current environment. + We strongly recommend using docker for code execution. + - timeout (Optional, int): The maximum execution time in seconds. + - last_n_messages (Experimental, Optional, int): The number of messages to look back for code execution. Default to 1. + default_auto_reply (str or dict or None): the default auto reply message when no code execution or llm based reply is generated. + llm_config (LLMConfig or dict or False or None): llm inference configuration. + Please refer to [OpenAIWrapper.create](https://docs.ag2.ai/latest/docs/api-reference/autogen/OpenAIWrapper/#autogen.OpenAIWrapper.create) + for available options. + Default to False, which disables llm-based auto reply. + When set to None, will use self.DEFAULT_CONFIG, which defaults to False. + system_message (str or List): system message for ChatCompletion inference. + Only used when llm_config is not False. Use it to reprogram the agent. + description (str): a short description of the agent. This description is used by other agents + (e.g. the GroupChatManager) to decide when to call upon this agent. (Default: system_message) + **kwargs (dict): Please refer to other kwargs in + [ConversableAgent](https://docs.ag2.ai/latest/docs/api-reference/autogen/ConversableAgent). + """ + super().__init__( + name=name, + system_message=system_message, + is_termination_msg=is_termination_msg, + max_consecutive_auto_reply=max_consecutive_auto_reply, + human_input_mode=human_input_mode, + function_map=function_map, + code_execution_config=code_execution_config, + llm_config=llm_config, + default_auto_reply=default_auto_reply, + description=( + description if description is not None else self.DEFAULT_USER_PROXY_AGENT_DESCRIPTIONS[human_input_mode] + ), + **kwargs, + ) + + if logging_enabled(): + log_new_agent(self, locals()) diff --git a/mm_agents/coact/autogen/agentchat/utils.py b/mm_agents/coact/autogen/agentchat/utils.py new file mode 100644 index 0000000..d2784bc --- /dev/null +++ b/mm_agents/coact/autogen/agentchat/utils.py @@ -0,0 +1,206 @@ +# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +import re +from typing import Any, Optional, Union + +from ..doc_utils import export_module +from .agent import Agent + + +def consolidate_chat_info( + chat_info: Union[dict[str, Any], list[dict[str, Any]]], uniform_sender: Optional[Agent] = None +) -> None: + if isinstance(chat_info, dict): + chat_info = [chat_info] + for c in chat_info: + if uniform_sender is None: + assert "sender" in c, "sender must be provided." + sender = c["sender"] + else: + sender = uniform_sender + assert "recipient" in c, "recipient must be provided." + summary_method = c.get("summary_method") + assert ( + summary_method is None or callable(summary_method) or summary_method in ("last_msg", "reflection_with_llm") + ), "summary_method must be a string chosen from 'reflection_with_llm' or 'last_msg' or a callable, or None." 
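+        # "reflection_with_llm" summaries are produced by an extra LLM call, so at
+        # least one side of the chat must carry an LLM client (checked below).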
+ if summary_method == "reflection_with_llm": + assert sender.client is not None or c["recipient"].client is not None, ( + "llm client must be set in either the recipient or sender when summary_method is reflection_with_llm." + ) + + +@export_module("autogen") +def gather_usage_summary(agents: list[Agent]) -> dict[str, dict[str, Any]]: + r"""Gather usage summary from all agents. + + Args: + agents: (list): List of agents. + + Returns: + dictionary: A dictionary containing two keys: + - "usage_including_cached_inference": Cost information on the total usage, including the tokens in cached inference. + - "usage_excluding_cached_inference": Cost information on the usage of tokens, excluding the tokens in cache. No larger than "usage_including_cached_inference". + + Example: + ```python + { + "usage_including_cached_inference": { + "total_cost": 0.0006090000000000001, + "gpt-35-turbo": { + "cost": 0.0006090000000000001, + "prompt_tokens": 242, + "completion_tokens": 123, + "total_tokens": 365, + }, + }, + "usage_excluding_cached_inference": { + "total_cost": 0.0006090000000000001, + "gpt-35-turbo": { + "cost": 0.0006090000000000001, + "prompt_tokens": 242, + "completion_tokens": 123, + "total_tokens": 365, + }, + }, + } + ``` + + Note: + If none of the agents incurred any cost (not having a client), then the usage_including_cached_inference and usage_excluding_cached_inference will be `{'total_cost': 0}`. + """ + + def aggregate_summary(usage_summary: dict[str, Any], agent_summary: dict[str, Any]) -> None: + if agent_summary is None: + return + usage_summary["total_cost"] += agent_summary.get("total_cost", 0) + for model, data in agent_summary.items(): + if model != "total_cost": + if model not in usage_summary: + usage_summary[model] = data.copy() + else: + usage_summary[model]["cost"] += data.get("cost", 0) + usage_summary[model]["prompt_tokens"] += data.get("prompt_tokens", 0) + usage_summary[model]["completion_tokens"] += data.get("completion_tokens", 0) + usage_summary[model]["total_tokens"] += data.get("total_tokens", 0) + + usage_including_cached_inference = {"total_cost": 0} + usage_excluding_cached_inference = {"total_cost": 0} + + for agent in agents: + if getattr(agent, "client", None): + aggregate_summary(usage_including_cached_inference, agent.client.total_usage_summary) # type: ignore[attr-defined] + aggregate_summary(usage_excluding_cached_inference, agent.client.actual_usage_summary) # type: ignore[attr-defined] + + return { + "usage_including_cached_inference": usage_including_cached_inference, + "usage_excluding_cached_inference": usage_excluding_cached_inference, + } + + +def parse_tags_from_content(tag: str, content: Union[str, list[dict[str, Any]]]) -> list[dict[str, Any]]: + """Parses HTML style tags from message contents. + + The parsing is done by looking for patterns in the text that match the format of HTML tags. The tag to be parsed is + specified as an argument to the function. The function looks for this tag in the text and extracts its content. The + content of a tag is everything that is inside the tag, between the opening and closing angle brackets. The content + can be a single string or a set of attribute-value pairs. + + Examples: + ` -> [{"tag": "img", "attr": {"src": "http://example.com/image.png"}, "match": re.Match}]` + ```