From b370170faf77c4e411940c1da246e5a56084215a Mon Sep 17 00:00:00 2001 From: Li Jiang Date: Tue, 6 Aug 2024 12:02:12 +0800 Subject: [PATCH 1/3] Stop retrieve more docs if all docs have been returned (#3282) --- .../contrib/retrieve_user_proxy_agent.py | 4 +- notebook/agentchat_RetrieveChat.ipynb | 135 +++++++----------- 2 files changed, 56 insertions(+), 83 deletions(-) diff --git a/autogen/agentchat/contrib/retrieve_user_proxy_agent.py b/autogen/agentchat/contrib/retrieve_user_proxy_agent.py index 4842bd4e9f53..90757af6fc3e 100644 --- a/autogen/agentchat/contrib/retrieve_user_proxy_agent.py +++ b/autogen/agentchat/contrib/retrieve_user_proxy_agent.py @@ -519,7 +519,7 @@ def _generate_retrieve_user_reply( self.problem, self.n_results * (2 * _tmp_retrieve_count + 1), self._search_string ) doc_contents = self._get_context(self._results) - if doc_contents: + if doc_contents or self.n_results * (2 * _tmp_retrieve_count + 1) >= len(self._results[0]): break elif update_context_case2: # Use the current intermediate info as the query text to retrieve docs, and each time we append the top similar @@ -531,7 +531,7 @@ def _generate_retrieve_user_reply( ) self._get_context(self._results) doc_contents = "\n".join(self._doc_contents) # + "\n" + "\n".join(self._intermediate_answers) - if doc_contents: + if doc_contents or self.n_results * (2 * _tmp_retrieve_count + 1) >= len(self._results[0]): break self.clear_history() diff --git a/notebook/agentchat_RetrieveChat.ipynb b/notebook/agentchat_RetrieveChat.ipynb index adb13ac47bd5..6fefcd3ba44c 100644 --- a/notebook/agentchat_RetrieveChat.ipynb +++ b/notebook/agentchat_RetrieveChat.ipynb @@ -48,14 +48,14 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 1, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "models to use: ['gpt-3.5-turbo-0125']\n" + "models to use: ['gpt-35-turbo', 'gpt4-1106-preview', 'gpt-4o']\n" ] } ], @@ -73,9 +73,7 @@ "# a vector database instance\n", "from autogen.retrieve_utils import TEXT_FORMATS\n", "\n", - "config_list = [\n", - " {\"model\": \"gpt-3.5-turbo-0125\", \"api_key\": \"\", \"api_type\": \"openai\"},\n", - "]\n", + "config_list = autogen.config_list_from_json(\"OAI_CONFIG_LIST\")\n", "\n", "assert len(config_list) > 0\n", "print(\"models to use: \", [config_list[i][\"model\"] for i in range(len(config_list))])" @@ -107,7 +105,7 @@ "output_type": "stream", "text": [ "Accepted file formats for `docs_path`:\n", - "['odt', 'xml', 'pdf', 'docx', 'html', 'md', 'htm', 'csv', 'rst', 'org', 'ppt', 'doc', 'log', 'json', 'epub', 'jsonl', 'pptx', 'yml', 'xlsx', 'tsv', 'txt', 'yaml', 'msg', 'rtf']\n" + "['txt', 'json', 'csv', 'tsv', 'md', 'html', 'htm', 'rtf', 'rst', 'jsonl', 'log', 'xml', 'yaml', 'yml', 'pdf']\n" ] } ], @@ -120,7 +118,16 @@ "cell_type": "code", "execution_count": 3, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/workspace/anaconda3/envs/autogen312/lib/python3.12/site-packages/sentence_transformers/cross_encoder/CrossEncoder.py:11: TqdmExperimentalWarning: Using `tqdm.autonotebook.tqdm` in notebook mode. Use `tqdm.tqdm` instead to force console mode (e.g. in jupyter console)\n", + " from tqdm.autonotebook import tqdm, trange\n" + ] + } + ], "source": [ "# 1. create an RetrieveAssistantAgent instance named \"assistant\"\n", "assistant = RetrieveAssistantAgent(\n", @@ -160,6 +167,7 @@ " # \"client\": chromadb.PersistentClient(path=\"/tmp/chromadb\"), # deprecated, use \"vector_db\" instead\n", " \"vector_db\": \"chroma\", # to use the deprecated `client` parameter, set to None and uncomment the line above\n", " \"overwrite\": False, # set to True if you want to overwrite an existing collection\n", + " \"get_or_create\": True, # set to False if don't want to reuse an existing collection\n", " },\n", " code_execution_config=False, # set to False if you don't want to execute the code\n", ")" @@ -188,7 +196,8 @@ "name": "stderr", "output_type": "stream", "text": [ - "2024-04-07 17:30:56,955 - autogen.agentchat.contrib.retrieve_user_proxy_agent - INFO - \u001b[32mUse the existing collection `autogen-docs`.\u001b[0m\n" + "2024-08-02 06:30:11,303 - autogen.agentchat.contrib.retrieve_user_proxy_agent - INFO - \u001b[32mUse the existing collection `autogen-docs`.\u001b[0m\n", + "2024-08-02 06:30:11,485 - autogen.agentchat.contrib.retrieve_user_proxy_agent - INFO - Found 2 chunks.\u001b[0m\n" ] }, { @@ -202,7 +211,6 @@ "name": "stderr", "output_type": "stream", "text": [ - "2024-04-07 17:30:59,609 - autogen.agentchat.contrib.retrieve_user_proxy_agent - INFO - Found 2 chunks.\u001b[0m\n", "Number of requested results 20 is greater than number of elements in index 2, updating n_results = 2\n" ] }, @@ -361,65 +369,53 @@ "--------------------------------------------------------------------------------\n", "\u001b[33massistant\u001b[0m (to ragproxyagent):\n", "\n", - "To perform a classification task using FLAML and use Spark to do parallel training for 30 seconds and force cancel jobs if the time limit is reached, you can follow these steps:\n", - "\n", - "1. First, convert your data into Spark dataframe format using `to_pandas_on_spark` function from `flaml.automl.spark.utils` module.\n", - "2. Then, format your data for use SparkML models by using `VectorAssembler`.\n", - "3. Define your AutoML settings, including the `metric`, `time_budget`, and `task`.\n", - "4. Use `AutoML` from `flaml` to run AutoML with SparkML models by setting `use_spark` to `true`, and `estimator_list` to a list of spark-based estimators, like `[\"lgbm_spark\"]`.\n", - "5. Set `n_concurrent_trials` to the desired number of parallel jobs and `force_cancel` to `True` to cancel the jobs if the time limit is reached.\n", - "\n", - "Here's an example code snippet for performing classification using FLAML and Spark:\n", - "\n", "```python\n", - "import pandas as pd\n", + "import flaml\n", "from flaml.automl.spark.utils import to_pandas_on_spark\n", "from pyspark.ml.feature import VectorAssembler\n", - "import flaml\n", + "import pandas as pd\n", "\n", - "# Creating a dictionary\n", + "# Example Data (Please provide real data in practice)\n", "data = {\n", - " \"sepal_length\": [5.1, 4.9, 4.7, 4.6, 5.0],\n", - " \"sepal_width\": [3.5, 3.0, 3.2, 3.1, 3.6],\n", - " \"petal_length\": [1.4, 1.4, 1.3, 1.5, 1.4],\n", - " \"petal_width\": [0.2, 0.2, 0.2, 0.2, 0.2],\n", - " \"species\": [\"setosa\", \"setosa\", \"setosa\", \"setosa\", \"setosa\"]\n", + " \"feature1\": [0, 1, 2, 3, 4],\n", + " \"feature2\": [1, 2, 3, 4, 5],\n", + " # ... add all features you need for your classification\n", + " \"label\": ['a', 'b', 'a', 'a', 'b'], # assuming binary classification with labels 'a' and 'b'\n", "}\n", "\n", - "# Creating a pandas DataFrame\n", - "dataframe = pd.DataFrame(data)\n", - "label = \"species\"\n", + "# Convert to Pandas DataFrame\n", + "pdf = pd.DataFrame(data)\n", "\n", - "# Convert to pandas-on-spark dataframe\n", - "psdf = to_pandas_on_spark(dataframe)\n", + "# Generate pandas-on-spark dataframe\n", + "psdf = to_pandas_on_spark(pdf)\n", "\n", - "# Format data for SparkML models\n", - "columns = psdf.columns\n", - "feature_cols = [col for col in columns if col != label]\n", + "# Organize data into feature vectors and labels\n", + "label_col = \"label\"\n", + "feature_cols = [col for col in psdf.columns if col != label_col]\n", "featurizer = VectorAssembler(inputCols=feature_cols, outputCol=\"features\")\n", - "psdf = featurizer.transform(psdf.to_spark(index_col=\"index\"))[\"index\", \"features\"]\n", "\n", - "# Define AutoML settings\n", - "settings = {\n", + "# Apply the transformation\n", + "psdf = featurizer.transform(psdf.to_spark(index_col=\"index\"))[\"index\", \"features\", label_col]\n", + "\n", + "# Prepare AutoML settings\n", + "automl_settings = {\n", " \"time_budget\": 30,\n", - " \"metric\": \"accuracy\",\n", + " \"metric\": \"accuracy\", # Change this to a classification metric you prefer\n", " \"task\": \"classification\",\n", + " \"n_concurrent_trials\": 2, # Or other number that fits your Spark cluster configuration\n", + " \"use_spark\": True,\n", + " \"force_cancel\": True, # Enable force cancel to obey the time constraint\n", + " \"estimator_list\": [\"lgbm_spark\"], # Specify SparkML estimators you want to try\n", "}\n", "\n", - "# Use AutoML with SparkML models and parallel jobs\n", + "# Create an AutoML instance\n", "automl = flaml.AutoML()\n", - "automl.fit(\n", - " dataframe=psdf,\n", - " label=label,\n", - " estimator_list=[\"lgbm_spark\"],\n", - " use_spark=True,\n", - " n_concurrent_trials=2,\n", - " force_cancel=True,\n", - " **settings,\n", - ")\n", - "```\n", "\n", - "Note that the above code assumes the data is small enough to train within 30 seconds. If you have a larger dataset, you may need to increase the `time_budget` and adjust the number of parallel jobs accordingly.\n", + "# Run the AutoML search\n", + "automl.fit(dataframe=psdf, label=label_col, **automl_settings)\n", + "``` \n", + "\n", + "Remember to replace the example data with your real dataset and choose an appropriate metric for your classification task. You'll also need a configured and running Spark environment to utilize the \"use_spark\" feature.\n", "\n", "--------------------------------------------------------------------------------\n", "\u001b[33mragproxyagent\u001b[0m (to assistant):\n", @@ -439,25 +435,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "Number of requested results 60 is greater than number of elements in index 2, updating n_results = 2\n", - "Number of requested results 100 is greater than number of elements in index 2, updating n_results = 2\n", - "Number of requested results 140 is greater than number of elements in index 2, updating n_results = 2\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "VectorDB returns doc_ids: [['bdfbc921']]\n", - "VectorDB returns doc_ids: [['bdfbc921']]\n", - "VectorDB returns doc_ids: [['bdfbc921']]\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "Number of requested results 180 is greater than number of elements in index 2, updating n_results = 2\n" + "Number of requested results 60 is greater than number of elements in index 2, updating n_results = 2\n" ] }, { @@ -470,18 +448,13 @@ "\n", "TERMINATE\n", "\n", + "--------------------------------------------------------------------------------\n", + "\u001b[33mragproxyagent\u001b[0m (to assistant):\n", + "\n", + "TERMINATE\n", + "\n", "--------------------------------------------------------------------------------\n" ] - }, - { - "data": { - "text/plain": [ - "ChatResult(chat_id=None, chat_history=[{'content': 'TERMINATE', 'role': 'assistant'}], summary='', cost=({'total_cost': 0.007691, 'gpt-35-turbo': {'cost': 0.007691, 'prompt_tokens': 4242, 'completion_tokens': 664, 'total_tokens': 4906}}, {'total_cost': 0}), human_input=[])" - ] - }, - "execution_count": 4, - "metadata": {}, - "output_type": "execute_result" } ], "source": [ @@ -2836,7 +2809,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.9" + "version": "3.12.4" }, "skip_test": "Requires interactive usage" }, From 2ab74dbfb9e0b63f3e4ce02d3ce3e911828c3d8e Mon Sep 17 00:00:00 2001 From: wenngong <76683249+wenngong@users.noreply.github.com> Date: Wed, 7 Aug 2024 00:08:10 +0800 Subject: [PATCH 2/3] avoid circular import (#3276) Co-authored-by: gongwn1 Co-authored-by: Li Jiang --- autogen/coding/base.py | 1 - 1 file changed, 1 deletion(-) diff --git a/autogen/coding/base.py b/autogen/coding/base.py index ccbfe6b92932..7c9e19d73f33 100644 --- a/autogen/coding/base.py +++ b/autogen/coding/base.py @@ -4,7 +4,6 @@ from pydantic import BaseModel, Field -from ..agentchat.agent import LLMAgent from ..types import UserMessageImageContentPart, UserMessageTextContentPart __all__ = ("CodeBlock", "CodeResult", "CodeExtractor", "CodeExecutor", "CodeExecutionConfig") From cf2fe4aa787aaecbe673cd679f9191118695d0d5 Mon Sep 17 00:00:00 2001 From: Xiaoyun Zhang Date: Tue, 6 Aug 2024 14:59:44 -0700 Subject: [PATCH 3/3] [.Net] Fix #3306 (#3310) * break conversation when orchestartor return null * enable test on different OS --- .github/workflows/dotnet-build.yml | 12 +++++++-- .../Extension/GroupChatExtension.cs | 7 ++++++ .../AutoGen.Tests/GroupChat/GroupChatTests.cs | 25 +++++++++++++++++++ 3 files changed, 42 insertions(+), 2 deletions(-) diff --git a/.github/workflows/dotnet-build.yml b/.github/workflows/dotnet-build.yml index 7e50025917de..6b7056cce6dc 100644 --- a/.github/workflows/dotnet-build.yml +++ b/.github/workflows/dotnet-build.yml @@ -43,12 +43,16 @@ jobs: if: steps.filter.outputs.workflows == 'true' build: name: Dotnet Build - runs-on: ubuntu-latest needs: paths-filter if: needs.paths-filter.outputs.hasChanges == 'true' defaults: run: working-directory: dotnet + strategy: + fail-fast: false + matrix: + os: [ ubuntu-latest, macos-latest, windows-latest ] + runs-on: ${{ matrix.os }} steps: - uses: actions/checkout@v4 with: @@ -92,7 +96,7 @@ jobs: - name: Setup dotnet uses: actions/setup-dotnet@v4 with: - global-json-file: dotnet/global.json + dotnet-version: '8.0.x' - name: publish AOT testApp, assert static analysis warning count, and run the app shell: pwsh @@ -181,12 +185,14 @@ jobs: env: AZURE_ARTIFACTS_FEED_URL: https://devdiv.pkgs.visualstudio.com/DevDiv/_packaging/AutoGen/nuget/v3/index.json NUGET_AUTH_TOKEN: ${{ secrets.AZURE_DEVOPS_TOKEN }} + continue-on-error: true - name: Publish nightly package to github package run: | echo "Publish nightly package to github package" echo "ls output directory" ls -R ./output/nightly dotnet nuget push --api-key ${{ secrets.GITHUB_TOKEN }} --source "https://nuget.pkg.github.com/microsoft/index.json" ./output/nightly/*.nupkg --skip-duplicate + continue-on-error: true - name: Publish nightly package to agentchat myget feed run: | echo "Publish nightly package to agentchat myget feed" @@ -195,3 +201,5 @@ jobs: dotnet nuget push --api-key ${{ secrets.MYGET_TOKEN }} --source "https://www.myget.org/F/agentchat/api/v3/index.json" ./output/nightly/*.nupkg --skip-duplicate env: MYGET_TOKEN: ${{ secrets.MYGET_TOKEN }} + continue-on-error: true + diff --git a/dotnet/src/AutoGen.Core/Extension/GroupChatExtension.cs b/dotnet/src/AutoGen.Core/Extension/GroupChatExtension.cs index 6b17a2b93fd6..89da7708797c 100644 --- a/dotnet/src/AutoGen.Core/Extension/GroupChatExtension.cs +++ b/dotnet/src/AutoGen.Core/Extension/GroupChatExtension.cs @@ -43,6 +43,13 @@ public static async IAsyncEnumerable SendAsync( while (maxRound-- > 0) { var messages = await groupChat.CallAsync(chatHistory, maxRound: 1, cancellationToken); + + // if no new messages, break the loop + if (messages.Count() == chatHistory.Count()) + { + yield break; + } + var lastMessage = messages.Last(); yield return lastMessage; diff --git a/dotnet/test/AutoGen.Tests/GroupChat/GroupChatTests.cs b/dotnet/test/AutoGen.Tests/GroupChat/GroupChatTests.cs index 19ca02ae92fa..9c2d2ce8197a 100644 --- a/dotnet/test/AutoGen.Tests/GroupChat/GroupChatTests.cs +++ b/dotnet/test/AutoGen.Tests/GroupChat/GroupChatTests.cs @@ -85,4 +85,29 @@ public async Task ItSendAsyncDoesntAddDuplicateInitializeMessagesTest() chatHistory.Count().Should().Be(2); } + + [Fact] + public async Task ItTerminateConversationWhenNoSpeakerAvailable() + { + // fix #3306 + var alice = new DefaultReplyAgent("Alice", "I am alice"); + var bob = new DefaultReplyAgent("Bob", "I am bob"); + var cathy = new DefaultReplyAgent("Cathy", $"I am cathy, {GroupChatExtension.TERMINATE}"); + + var orchestrator = Mock.Of(); + Mock.Get(orchestrator).Setup(x => x.GetNextSpeakerAsync(It.IsAny(), It.IsAny())) + .ReturnsAsync((IAgent?)null); + + var groupChat = new GroupChat([alice, bob, cathy], orchestrator); + + var chatHistory = new List(); + + var maxRound = 10; + await foreach (var message in groupChat.SendAsync(chatHistory, maxRound)) + { + chatHistory.Add(message); + } + + chatHistory.Count().Should().Be(0); + } }