From 756937fb2c8998d4ddfdf6f2291d89bad58e0d3f Mon Sep 17 00:00:00 2001 From: Evan Mattson <35585003+moonbox3@users.noreply.github.com> Date: Fri, 5 Jan 2024 10:31:57 -0500 Subject: [PATCH 1/5] Python: Handle errors if no event loop running in current thread. (#4485) ### Motivation and Context If invoking multiple functions, there may not be an event loop running in the current thread. The check for the event loop can throw an error, which is seen when trying to run functions in a loop, as an example. ### Description Adding a try catch to handle any errors when checking for this event loop. ### Contribution Checklist - [X] The code builds clean without any errors or warnings - [X] The PR follows the [SK Contribution Guidelines](https://github.com/microsoft/semantic-kernel/blob/main/CONTRIBUTING.md) and the [pre-submission formatting script](https://github.com/microsoft/semantic-kernel/blob/main/CONTRIBUTING.md#development-scripts) raises no violations - [X] All unit tests pass, and I have added new tests where possible - [X] I didn't break anyone :smile: Co-authored-by: Evan Mattson --- python/semantic_kernel/orchestration/sk_function.py | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/python/semantic_kernel/orchestration/sk_function.py b/python/semantic_kernel/orchestration/sk_function.py index 64ce94f8bb30..5e8b7b0753b2 100644 --- a/python/semantic_kernel/orchestration/sk_function.py +++ b/python/semantic_kernel/orchestration/sk_function.py @@ -366,7 +366,10 @@ def invoke( if input is not None: context.variables.update(input) - loop = asyncio.get_running_loop() if asyncio.get_event_loop().is_running() else None + try: + loop = asyncio.get_running_loop() if asyncio.get_event_loop().is_running() else None + except RuntimeError: + loop = None if loop and loop.is_running(): coroutine_function = self._invoke_semantic_async if self.is_semantic else self._invoke_native_async From 8618cd32ef9111188c07536a974cb47902e1c42f Mon Sep 17 00:00:00 2001 From: 
Evan Mattson <35585003+moonbox3@users.noreply.github.com> Date: Fri, 5 Jan 2024 11:35:49 -0500 Subject: [PATCH 2/5] Python: Bump Python Package version for release. Update notebook refs to use AIRequestSettings. (#4478) ### Motivation and Context Bump Python Package version for release. Update notebook refs and request settings to use the new AIRequestSettings classes. Fix hugging face bug that requires generator input as text_inputs instead of prompt. Add a hugging face request settings unit test. ### Description Bump Python Package version for release. Update notebook refs to point to new package version. ### Contribution Checklist - [X] The code builds clean without any errors or warnings - [X] The PR follows the [SK Contribution Guidelines](https://github.com/microsoft/semantic-kernel/blob/main/CONTRIBUTING.md) and the [pre-submission formatting script](https://github.com/microsoft/semantic-kernel/blob/main/CONTRIBUTING.md#development-scripts) raises no violations - [X] All unit tests pass, and I have added new tests where possible - [X] I didn't break anyone :smile: --------- Co-authored-by: Evan Mattson --- python/notebooks/00-getting-started.ipynb | 4 +- .../01-basic-loading-the-kernel.ipynb | 25 +- .../02-running-prompts-from-file.ipynb | 13 +- .../03-semantic-function-inline.ipynb | 22 +- .../notebooks/04-context-variables-chat.ipynb | 20 +- python/notebooks/05-using-the-planner.ipynb | 44 +- .../notebooks/06-memory-and-embeddings.ipynb | 1074 +++++++++-------- .../07-hugging-face-for-skills.ipynb | 4 +- .../notebooks/08-native-function-inline.ipynb | 4 +- .../notebooks/09-groundedness-checking.ipynb | 4 +- .../10-multiple-results-per-prompt.ipynb | 119 +- .../notebooks/11-streaming-completions.ipynb | 94 +- .../weaviate-persistent-memory.ipynb | 1036 ++++++++-------- python/pyproject.toml | 2 +- .../openai_logit_bias.py | 33 +- .../ai/hugging_face/hf_request_settings.py | 2 +- .../services/hf_text_completion.py | 2 +- .../open_ai_request_settings.py | 2 
+- 18 files changed, 1319 insertions(+), 1185 deletions(-) diff --git a/python/notebooks/00-getting-started.ipynb b/python/notebooks/00-getting-started.ipynb index 8fe6a3374e71..db08ad662d99 100644 --- a/python/notebooks/00-getting-started.ipynb +++ b/python/notebooks/00-getting-started.ipynb @@ -16,7 +16,7 @@ "metadata": {}, "outputs": [], "source": [ - "!python -m pip install semantic-kernel==0.4.3.dev0" + "!python -m pip install semantic-kernel==0.4.4.dev0" ] }, { @@ -57,7 +57,7 @@ "\n", "api_key, org_id = sk.openai_settings_from_dot_env()\n", "\n", - "kernel.add_chat_service(\"chat-gpt\", OpenAIChatCompletion(ai_model_id=\"gpt-3.5-turbo\", api_key=api_key, org_id=org_id))" + "kernel.add_chat_service(\"chat-gpt\", OpenAIChatCompletion(ai_model_id=\"gpt-3.5-turbo-1106\", api_key=api_key, org_id=org_id))" ] }, { diff --git a/python/notebooks/01-basic-loading-the-kernel.ipynb b/python/notebooks/01-basic-loading-the-kernel.ipynb index da00f754ea09..87dbadb87fcf 100644 --- a/python/notebooks/01-basic-loading-the-kernel.ipynb +++ b/python/notebooks/01-basic-loading-the-kernel.ipynb @@ -25,17 +25,20 @@ "metadata": {}, "outputs": [], "source": [ - "!python -m pip install semantic-kernel==0.4.3.dev0" + "!python -m pip install semantic-kernel==0.4.4.dev0" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import semantic_kernel as sk\n", - "from semantic_kernel.connectors.ai.open_ai import AzureChatCompletion, OpenAIChatCompletion" + "from semantic_kernel.connectors.ai.open_ai import (\n", + " AzureChatCompletion,\n", + " OpenAIChatCompletion,\n", + ")" ] }, { @@ -48,7 +51,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 2, "metadata": {}, "outputs": [], "source": [ @@ -85,13 +88,13 @@ " )\n", ")\n", "\n", - "kernel.add_chat_service( # We are adding a text service\n", - " \"OpenAI_chat_gpt\", # The alias we can use in prompt templates' config.json\n", + 
"kernel.add_chat_service( # We are adding a text service\n", + " \"OpenAI_chat_gpt\", # The alias we can use in prompt templates' config.json\n", " OpenAIChatCompletion(\n", - " ai_model_id=\"gpt-3.5-turbo\", # OpenAI Model Name\n", - " api_key=\"...your OpenAI API Key...\", # OpenAI API key\n", - " org_id=\"...your OpenAI Org ID...\" # *optional* OpenAI Organization ID\n", - " )\n", + " ai_model_id=\"gpt-3.5-turbo\", # OpenAI Model Name\n", + " api_key=\"...your OpenAI API Key...\", # OpenAI API key\n", + " org_id=\"...your OpenAI Org ID...\", # *optional* OpenAI Organization ID\n", + " ),\n", ")" ] }, @@ -143,7 +146,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.6" + "version": "3.10.12" }, "polyglot_notebook": { "kernelInfo": { diff --git a/python/notebooks/02-running-prompts-from-file.ipynb b/python/notebooks/02-running-prompts-from-file.ipynb index c15d38e16e7f..17519257d6c3 100644 --- a/python/notebooks/02-running-prompts-from-file.ipynb +++ b/python/notebooks/02-running-prompts-from-file.ipynb @@ -89,7 +89,7 @@ "metadata": {}, "outputs": [], "source": [ - "!python -m pip install semantic-kernel==0.4.3.dev0" + "!python -m pip install semantic-kernel==0.4.4.dev0" ] }, { @@ -100,7 +100,10 @@ "outputs": [], "source": [ "import semantic_kernel as sk\n", - "from semantic_kernel.connectors.ai.open_ai import AzureChatCompletion, OpenAIChatCompletion\n", + "from semantic_kernel.connectors.ai.open_ai import (\n", + " AzureChatCompletion,\n", + " OpenAIChatCompletion,\n", + ")\n", "\n", "kernel = sk.Kernel()\n", "\n", @@ -109,7 +112,9 @@ "# Configure AI service used by the kernel\n", "if useAzureOpenAI:\n", " deployment, api_key, endpoint = sk.azure_openai_settings_from_dot_env()\n", - " azure_chat_service = AzureChatCompletion(deployment_name=\"turbo\", endpoint=endpoint, api_key=api_key) # set the deployment name to the value of your chat model\n", + " azure_chat_service = AzureChatCompletion(\n", + " 
deployment_name=\"turbo\", endpoint=endpoint, api_key=api_key\n", + " ) # set the deployment name to the value of your chat model\n", " kernel.add_chat_service(\"chat_completion\", azure_chat_service)\n", "else:\n", " api_key, org_id = sk.openai_settings_from_dot_env()\n", @@ -192,7 +197,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.6" + "version": "3.10.12" } }, "nbformat": 4, diff --git a/python/notebooks/03-semantic-function-inline.ipynb b/python/notebooks/03-semantic-function-inline.ipynb index fa633ef30a57..f5c90d8b1d2f 100644 --- a/python/notebooks/03-semantic-function-inline.ipynb +++ b/python/notebooks/03-semantic-function-inline.ipynb @@ -55,7 +55,7 @@ "metadata": {}, "outputs": [], "source": [ - "!python -m pip install semantic-kernel==0.4.3.dev0" + "!python -m pip install semantic-kernel==0.4.4.dev0" ] }, { @@ -66,7 +66,10 @@ "outputs": [], "source": [ "import semantic_kernel as sk\n", - "from semantic_kernel.connectors.ai.open_ai import AzureTextCompletion, OpenAITextCompletion\n", + "from semantic_kernel.connectors.ai.open_ai import (\n", + " AzureTextCompletion,\n", + " OpenAITextCompletion,\n", + ")\n", "\n", "kernel = sk.Kernel()\n", "\n", @@ -75,7 +78,9 @@ "# Configure AI service used by the kernel\n", "if useAzureOpenAI:\n", " deployment, api_key, endpoint = sk.azure_openai_settings_from_dot_env()\n", - " azure_text_service = AzureTextCompletion(deployment_name=\"text\", endpoint=endpoint, api_key=api_key) # set the deployment name to the value of your text model\n", + " azure_text_service = AzureTextCompletion(\n", + " deployment_name=\"text\", endpoint=endpoint, api_key=api_key\n", + " ) # set the deployment name to the value of your text model\n", " kernel.add_text_completion_service(\"dv\", azure_text_service)\n", "else:\n", " api_key, org_id = sk.openai_settings_from_dot_env()\n", @@ -196,7 +201,10 @@ "outputs": [], "source": [ "import semantic_kernel as sk\n", - "from 
semantic_kernel.connectors.ai.open_ai import AzureChatCompletion, OpenAIChatCompletion\n", + "from semantic_kernel.connectors.ai.open_ai import (\n", + " AzureChatCompletion,\n", + " OpenAIChatCompletion,\n", + ")\n", "\n", "kernel = sk.Kernel()\n", "\n", @@ -205,7 +213,9 @@ "# Configure AI service used by the kernel\n", "if useAzureOpenAI:\n", " deployment, api_key, endpoint = sk.azure_openai_settings_from_dot_env()\n", - " azure_chat_service = AzureChatCompletion(deployment_name=\"turbo\", endpoint=endpoint, api_key=api_key) # set the deployment name to the value of your chat model\n", + " azure_chat_service = AzureChatCompletion(\n", + " deployment_name=\"turbo\", endpoint=endpoint, api_key=api_key\n", + " ) # set the deployment name to the value of your chat model\n", " kernel.add_chat_service(\"chat_completion\", azure_chat_service)\n", "else:\n", " api_key, org_id = sk.openai_settings_from_dot_env()\n", @@ -241,7 +251,7 @@ "\n", "summary = tldr_function(text)\n", "\n", - "print(f\"Output: {summary}\") # Output: Robots must not harm humans." + "print(f\"Output: {summary}\") # Output: Robots must not harm humans." 
] } ], diff --git a/python/notebooks/04-context-variables-chat.ipynb b/python/notebooks/04-context-variables-chat.ipynb index baed381d49b1..8eff5b7f3838 100644 --- a/python/notebooks/04-context-variables-chat.ipynb +++ b/python/notebooks/04-context-variables-chat.ipynb @@ -26,7 +26,7 @@ "metadata": {}, "outputs": [], "source": [ - "!python -m pip install semantic-kernel==0.4.3.dev0" + "!python -m pip install semantic-kernel==0.4.4.dev0" ] }, { @@ -37,7 +37,10 @@ "outputs": [], "source": [ "import semantic_kernel as sk\n", - "from semantic_kernel.connectors.ai.open_ai import AzureChatCompletion, OpenAIChatCompletion\n", + "from semantic_kernel.connectors.ai.open_ai import (\n", + " AzureChatCompletion,\n", + " OpenAIChatCompletion,\n", + ")\n", "\n", "kernel = sk.Kernel()\n", "\n", @@ -46,10 +49,16 @@ "# Configure AI service used by the kernel\n", "if useAzureOpenAI:\n", " deployment, api_key, endpoint = sk.azure_openai_settings_from_dot_env()\n", - " kernel.add_chat_service(\"chat_completion\", AzureChatCompletion(deployment_name=deployment, endpoint=endpoint, api_key=api_key))\n", + " kernel.add_chat_service(\n", + " \"chat_completion\",\n", + " AzureChatCompletion(deployment_name=deployment, endpoint=endpoint, api_key=api_key),\n", + " )\n", "else:\n", " api_key, org_id = sk.openai_settings_from_dot_env()\n", - " kernel.add_chat_service(\"gpt-3.5\", OpenAIChatCompletion(ai_model_id=\"gpt-3.5-turbo\", api_key=api_key, org_id=org_id))\n" + " kernel.add_chat_service(\n", + " \"gpt-3.5\",\n", + " OpenAIChatCompletion(ai_model_id=\"gpt-3.5-turbo\", api_key=api_key, org_id=org_id),\n", + " )" ] }, { @@ -98,7 +107,8 @@ " function_name=\"ChatBot\",\n", " max_tokens=2000,\n", " temperature=0.7,\n", - " top_p=0.5)" + " top_p=0.5,\n", + ")" ] }, { diff --git a/python/notebooks/05-using-the-planner.ipynb b/python/notebooks/05-using-the-planner.ipynb index a9f3be5bfc95..188c9dfa8464 100644 --- a/python/notebooks/05-using-the-planner.ipynb +++ 
b/python/notebooks/05-using-the-planner.ipynb @@ -23,7 +23,7 @@ "metadata": {}, "outputs": [], "source": [ - "!python -m pip install semantic-kernel==0.4.3.dev0" + "!python -m pip install semantic-kernel==0.4.4.dev0" ] }, { @@ -34,7 +34,10 @@ "outputs": [], "source": [ "import semantic_kernel as sk\n", - "from semantic_kernel.connectors.ai.open_ai import OpenAIChatCompletion, AzureChatCompletion\n", + "from semantic_kernel.connectors.ai.open_ai import (\n", + " OpenAIChatCompletion,\n", + " AzureChatCompletion,\n", + ")\n", "\n", "kernel = sk.Kernel()\n", "\n", @@ -43,10 +46,16 @@ "# Configure AI backend used by the kernel\n", "if useAzureOpenAI:\n", " deployment, api_key, endpoint = sk.azure_openai_settings_from_dot_env()\n", - " kernel.add_chat_service(\"chat_completion\", AzureChatCompletion(deployment_name=deployment, endpoint=endpoint, api_key=api_key))\n", + " kernel.add_chat_service(\n", + " \"chat_completion\",\n", + " AzureChatCompletion(deployment_name=deployment, endpoint=endpoint, api_key=api_key),\n", + " )\n", "else:\n", " api_key, org_id = sk.openai_settings_from_dot_env()\n", - " kernel.add_chat_service(\"gpt-3.5\", OpenAIChatCompletion(ai_model_id=\"gpt-3.5-turbo\", api_key=api_key, org_id=org_id))" + " kernel.add_chat_service(\n", + " \"gpt-3.5\",\n", + " OpenAIChatCompletion(ai_model_id=\"gpt-3.5-turbo\", api_key=api_key, org_id=org_id),\n", + " )" ] }, { @@ -127,6 +136,7 @@ "outputs": [], "source": [ "from semantic_kernel.planning.basic_planner import BasicPlanner\n", + "\n", "planner = BasicPlanner()" ] }, @@ -185,7 +195,8 @@ " function_name=\"shakespeare\",\n", " skill_name=\"ShakespeareSkill\",\n", " max_tokens=2000,\n", - " temperature=0.8)" + " temperature=0.8,\n", + ")" ] }, { @@ -299,6 +310,7 @@ "outputs": [], "source": [ "from semantic_kernel.planning import SequentialPlanner\n", + "\n", "planner = SequentialPlanner(kernel)" ] }, @@ -383,6 +395,7 @@ "outputs": [], "source": [ "from semantic_kernel.planning import ActionPlanner\n", + 
"\n", "planner = ActionPlanner(kernel)" ] }, @@ -402,6 +415,7 @@ "outputs": [], "source": [ "from semantic_kernel.core_skills import FileIOSkill, MathSkill, TextSkill, TimeSkill\n", + "\n", "kernel.import_skill(MathSkill(), \"math\")\n", "kernel.import_skill(FileIOSkill(), \"fileIO\")\n", "kernel.import_skill(TimeSkill(), \"time\")\n", @@ -502,15 +516,17 @@ " \"\"\"\n", " A search engine skill.\n", " \"\"\"\n", + "\n", " from semantic_kernel.orchestration.sk_context import SKContext\n", - " from semantic_kernel.skill_definition import sk_function, sk_function_context_parameter\n", + " from semantic_kernel.skill_definition import (\n", + " sk_function,\n", + " sk_function_context_parameter,\n", + " )\n", "\n", " def __init__(self, connector) -> None:\n", " self._connector = connector\n", "\n", - " @sk_function(\n", - " description=\"Performs a web search for a given query\", name=\"searchAsync\"\n", - " )\n", + " @sk_function(description=\"Performs a web search for a given query\", name=\"searchAsync\")\n", " @sk_function_context_parameter(\n", " name=\"query\",\n", " description=\"The search query\",\n", @@ -564,9 +580,7 @@ "metadata": {}, "outputs": [], "source": [ - "planner = StepwisePlanner(\n", - " kernel, StepwisePlannerConfig(max_iterations=10, min_iteration_time_ms=1000)\n", - ")" + "planner = StepwisePlanner(kernel, StepwisePlannerConfig(max_iterations=10, min_iteration_time_ms=1000))" ] }, { @@ -626,10 +640,10 @@ "source": [ "for index, step in enumerate(plan._steps):\n", " print(\"Step:\", index)\n", - " print(\"Description:\",step.description)\n", + " print(\"Description:\", step.description)\n", " print(\"Function:\", step.skill_name + \".\" + step._function.name)\n", " if len(step._outputs) > 0:\n", - " print( \" Output:\\n\", str.replace(result[step._outputs[0]],\"\\n\", \"\\n \"))" + " print(\" Output:\\n\", str.replace(result[step._outputs[0]], \"\\n\", \"\\n \"))" ] } ], @@ -649,7 +663,7 @@ "name": "python", "nbconvert_exporter": "python", 
"pygments_lexer": "ipython3", - "version": "3.11.6" + "version": "3.10.12" } }, "nbformat": 4, diff --git a/python/notebooks/06-memory-and-embeddings.ipynb b/python/notebooks/06-memory-and-embeddings.ipynb index 95e686b9ca95..0a89aceabaa2 100644 --- a/python/notebooks/06-memory-and-embeddings.ipynb +++ b/python/notebooks/06-memory-and-embeddings.ipynb @@ -1,538 +1,546 @@ { - "cells": [ - { - "attachments": {}, - "cell_type": "markdown", - "id": "68e1c158", - "metadata": {}, - "source": [ - "# Building Semantic Memory with Embeddings\n", - "\n", - "So far, we've mostly been treating the kernel as a stateless orchestration engine.\n", - "We send text into a model API and receive text out. \n", - "\n", - "In a [previous notebook](04-context-variables-chat.ipynb), we used `context variables` to pass in additional\n", - "text into prompts to enrich them with more context. This allowed us to create a basic chat experience. \n", - "\n", - "However, if you solely relied on context variables, you would quickly realize that eventually your prompt\n", - "would grow so large that you would run into the model's token limit. What we need is a way to persist state\n", - "and build both short-term and long-term memory to empower even more intelligent applications. \n", - "\n", - "To do this, we dive into the key concept of `Semantic Memory` in the Semantic Kernel. 
" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a77bdf89", - "metadata": {}, - "outputs": [], - "source": [ - "!python -m pip install semantic-kernel==0.4.3.dev0" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "508ad44f", - "metadata": {}, - "outputs": [], - "source": [ - "from typing import Tuple\n", - "\n", - "import semantic_kernel as sk\n", - "from semantic_kernel.connectors.ai.open_ai import OpenAIChatCompletion, OpenAITextEmbedding, AzureChatCompletion, AzureTextEmbedding" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "id": "d8ddffc1", - "metadata": {}, - "source": [ - "In order to use memory, we need to instantiate the Kernel with a Memory Storage\n", - "and an Embedding service. In this example, we make use of the `VolatileMemoryStore` which can be thought of as a temporary in-memory storage. This memory is not written to disk and is only available during the app session.\n", - "\n", - "When developing your app you will have the option to plug in persistent storage like Azure AI Search, Azure Cosmos Db, PostgreSQL, SQLite, etc. Semantic Memory allows also to index external data sources, without duplicating all the information as you will see further down in this notebook." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "8f8dcbc6", - "metadata": {}, - "outputs": [], - "source": [ - "kernel = sk.Kernel()\n", - "\n", - "useAzureOpenAI = False\n", - "\n", - "# Configure AI service used by the kernel\n", - "if useAzureOpenAI:\n", - " deployment, api_key, endpoint = sk.azure_openai_settings_from_dot_env()\n", - " # next line assumes chat deployment name is \"turbo\", adjust the deployment name to the value of your chat model if needed\n", - " azure_chat_service = AzureChatCompletion(deployment_name=\"turbo\", endpoint=endpoint, api_key=api_key)\n", - " # next line assumes embeddings deployment name is \"text-embedding\", adjust the deployment name to the value of your chat model if needed \n", - " azure_text_embedding = AzureTextEmbedding(deployment_name=\"text-embedding\", endpoint=endpoint, api_key=api_key)\n", - " kernel.add_chat_service(\"chat_completion\", azure_chat_service)\n", - " kernel.add_text_embedding_generation_service(\"ada\", azure_text_embedding)\n", - "else:\n", - " api_key, org_id = sk.openai_settings_from_dot_env()\n", - " oai_chat_service = OpenAIChatCompletion(ai_model_id=\"gpt-3.5-turbo\", api_key=api_key, org_id=org_id)\n", - " oai_text_embedding = OpenAITextEmbedding(ai_model_id=\"text-embedding-ada-002\", api_key=api_key, org_id=org_id)\n", - " kernel.add_chat_service(\"chat-gpt\", oai_chat_service)\n", - " kernel.add_text_embedding_generation_service(\"ada\", oai_text_embedding)\n", - "\n", - "kernel.register_memory_store(memory_store=sk.memory.VolatileMemoryStore())\n", - "kernel.import_skill(sk.core_skills.TextMemorySkill())" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "id": "e7fefb6a", - "metadata": {}, - "source": [ - "At its core, Semantic Memory is a set of data structures that allow you to store the meaning of text that come from different data sources, and optionally to store the source text too. 
These texts can be from the web, e-mail providers, chats, a database, or from your local directory, and are hooked up to the Semantic Kernel through data source connectors.\n", - "\n", - "The texts are embedded or compressed into a vector of floats representing mathematically the texts' contents and meaning. You can read more about embeddings [here](https://aka.ms/sk/embeddings)." - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "id": "2a7e7ca4", - "metadata": {}, - "source": [ - "### Manually adding memories\n", - "Let's create some initial memories \"About Me\". We can add memories to our `VolatileMemoryStore` by using `SaveInformationAsync`" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "d096504c", - "metadata": {}, - "outputs": [], - "source": [ - "async def populate_memory(kernel: sk.Kernel) -> None:\n", - " # Add some documents to the semantic memory\n", - " await kernel.memory.save_information_async(\n", - " collection=\"aboutMe\", id=\"info1\", text=\"My name is Andrea\"\n", - " )\n", - " await kernel.memory.save_information_async(\n", - " collection=\"aboutMe\", id=\"info2\", text=\"I currently work as a tour guide\"\n", - " )\n", - " await kernel.memory.save_information_async(\n", - " collection= \"aboutMe\", id=\"info3\", text=\"I've been living in Seattle since 2005\"\n", - " )\n", - " await kernel.memory.save_information_async(\n", - " collection=\"aboutMe\", id=\"info4\", text=\"I visited France and Italy five times since 2015\"\n", - " )\n", - " await kernel.memory.save_information_async(\n", - " collection=\"aboutMe\", id=\"info5\", text=\"My family is from New York\"\n", - " )" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "await populate_memory(kernel)" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "id": "2calf857", - "metadata": {}, - "source": [ - "Let's try searching the memory:" - ] - }, - { - "cell_type": "code", - 
"execution_count": null, - "id": "628c843e", - "metadata": {}, - "outputs": [], - "source": [ - "async def search_memory_examples(kernel: sk.Kernel) -> None:\n", - " questions = [\n", - " \"what's my name\",\n", - " \"where do I live?\",\n", - " \"where's my family from?\",\n", - " \"where have I traveled?\",\n", - " \"what do I do for work\",\n", - " ]\n", - "\n", - " for question in questions:\n", - " print(f\"Question: {question}\")\n", - " result = await kernel.memory.search_async(\"aboutMe\", question)\n", - " print(f\"Answer: {result[0].text}\\n\")" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "await search_memory_examples(kernel)" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "id": "e70c2b22", - "metadata": {}, - "source": [ - "Let's now revisit the our chat sample from the [previous notebook](04-context-variables-chat.ipynb).\n", - "If you remember, we used context variables to fill the prompt with a `history` that continuously got populated as we chatted with the bot. Let's add also memory to it!" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "id": "1ed54a32", - "metadata": {}, - "source": [ - "This is done by using the `TextMemorySkill` which exposes the `recall` native function.\n", - "\n", - "`recall` takes an input ask and performs a similarity search on the contents that have\n", - "been embedded in the Memory Store and returns the most relevant memory. 
" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "fb8549b2", - "metadata": {}, - "outputs": [], - "source": [ - "async def setup_chat_with_memory(\n", - " kernel: sk.Kernel,\n", - ") -> Tuple[sk.SKFunctionBase, sk.SKContext]:\n", - " sk_prompt = \"\"\"\n", - " ChatBot can have a conversation with you about any topic.\n", - " It can give explicit instructions or say 'I don't know' if\n", - " it does not have an answer.\n", - "\n", - " Information about me, from previous conversations:\n", - " - {{$fact1}} {{recall $fact1}}\n", - " - {{$fact2}} {{recall $fact2}}\n", - " - {{$fact3}} {{recall $fact3}}\n", - " - {{$fact4}} {{recall $fact4}}\n", - " - {{$fact5}} {{recall $fact5}}\n", - "\n", - " Chat:\n", - " {{$chat_history}}\n", - " User: {{$user_input}}\n", - " ChatBot: \"\"\".strip()\n", - "\n", - " chat_func = kernel.create_semantic_function(sk_prompt, max_tokens=200, temperature=0.8)\n", - "\n", - " context = kernel.create_new_context()\n", - " context[\"fact1\"] = \"what is my name?\"\n", - " context[\"fact2\"] = \"where do I live?\"\n", - " context[\"fact3\"] = \"where's my family from?\"\n", - " context[\"fact4\"] = \"where have I traveled?\"\n", - " context[\"fact5\"] = \"what do I do for work?\"\n", - "\n", - " context[sk.core_skills.TextMemorySkill.COLLECTION_PARAM] = \"aboutMe\"\n", - " context[sk.core_skills.TextMemorySkill.RELEVANCE_PARAM] = \"0.8\"\n", - "\n", - " context[\"chat_history\"] = \"\"\n", - "\n", - " return chat_func, context" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "id": "1ac62457", - "metadata": {}, - "source": [ - "The `RelevanceParam` is used in memory search and is a measure of the relevance score from 0.0 to 1.0, where 1.0 means a perfect match. We encourage users to experiment with different values." - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "id": "645b55a1", - "metadata": {}, - "source": [ - "Now that we've included our memories, let's chat!" 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "75267a2f", - "metadata": {}, - "outputs": [], - "source": [ - "async def chat(\n", - " kernel: sk.Kernel, chat_func: sk.SKFunctionBase, context: sk.SKContext\n", - ") -> bool:\n", - " try:\n", - " user_input = input(\"User:> \")\n", - " context[\"user_input\"] = user_input\n", - " print(f\"User:> {user_input}\")\n", - " except KeyboardInterrupt:\n", - " print(\"\\n\\nExiting chat...\")\n", - " return False\n", - " except EOFError:\n", - " print(\"\\n\\nExiting chat...\")\n", - " return False\n", - "\n", - " if user_input == \"exit\":\n", - " print(\"\\n\\nExiting chat...\")\n", - " return False\n", - "\n", - " answer = await kernel.run_async(chat_func, input_vars=context.variables)\n", - " context[\"chat_history\"] += f\"\\nUser:> {user_input}\\nChatBot:> {answer}\\n\"\n", - "\n", - " print(f\"ChatBot:> {answer}\")\n", - " return True" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "e3875a34", - "metadata": {}, - "outputs": [], - "source": [ - "print(\"Populating memory...\")\n", - "await populate_memory(kernel)\n", - "\n", - "print(\"Asking questions... (manually)\")\n", - "await search_memory_examples(kernel)\n", - "\n", - "print(\"Setting up a chat (with memory!)\")\n", - "chat_func, context = await setup_chat_with_memory(kernel)\n", - "\n", - "print(\"Begin chatting (type 'exit' to exit):\\n\")\n", - "chatting = True\n", - "while chatting:\n", - " chatting = await chat(kernel, chat_func, context)" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "id": "0a51542b", - "metadata": {}, - "source": [ - "### Adding documents to your memory\n", - "\n", - "Many times in your applications you'll want to bring in external documents into your memory. Let's see how we can do this using our VolatileMemoryStore.\n", - "\n", - "Let's first get some data using some of the links in the Semantic Kernel repo." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "c3d5a1b9", - "metadata": {}, - "outputs": [], - "source": [ - "github_files ={}\n", - "github_files[\"https://github.com/microsoft/semantic-kernel/blob/main/README.md\"] = \\\n", - " \"README: Installation, getting started, and how to contribute\"\n", - "github_files[\"https://github.com/microsoft/semantic-kernel/blob/main/dotnet/notebooks/02-running-prompts-from-file.ipynb\"] = \\\n", - " \"Jupyter notebook describing how to pass prompts from a file to a semantic skill or function\"\n", - "github_files[\"https://github.com/microsoft/semantic-kernel/blob/main/dotnet/notebooks/00-getting-started.ipynb\"] = \\\n", - " \"Jupyter notebook describing how to get started with the Semantic Kernel\"\n", - "github_files[\"https://github.com/microsoft/semantic-kernel/tree/main/samples/skills/ChatSkill/ChatGPT\"] = \\\n", - " \"Sample demonstrating how to create a chat skill interfacing with ChatGPT\"\n", - "github_files[\"https://github.com/microsoft/semantic-kernel/blob/main/dotnet/src/SemanticKernel/Memory/Volatile/VolatileMemoryStore.cs\"] = \\\n", - " \"C# class that defines a volatile embedding store\"" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "id": "75f3ea5e", - "metadata": {}, - "source": [ - "Now let's add these files to our VolatileMemoryStore using `SaveReferenceAsync`. We'll separate these memories from the chat memories by putting them in a different collection." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "170e7142", - "metadata": {}, - "outputs": [], - "source": [ - "memory_collection_name = \"SKGitHub\"\n", - "print(\"Adding some GitHub file URLs and their descriptions to a volatile Semantic Memory.\");\n", - "i = 0\n", - "for entry, value in github_files.items():\n", - " await kernel.memory.save_reference_async(\n", - " collection=memory_collection_name,\n", - " description=value,\n", - " text=value,\n", - " external_id=entry,\n", - " external_source_name=\"GitHub\"\n", - " )\n", - " i += 1\n", - " print(\" URL {} saved\".format(i))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "143911c3", - "metadata": {}, - "outputs": [], - "source": [ - "ask = \"I love Jupyter notebooks, how should I get started?\"\n", - "print(\"===========================\\n\" + \"Query: \" + ask + \"\\n\")\n", - "\n", - "memories = await kernel.memory.search_async(memory_collection_name, ask, limit=5, min_relevance_score=0.77)\n", - "\n", - "i = 0\n", - "for memory in memories:\n", - " i += 1\n", - " print(f\"Result {i}:\")\n", - " print(\" URL: : \" + memory.id)\n", - " print(\" Title : \" + memory.description)\n", - " print(\" Relevance: \" + str(memory.relevance))\n", - " print()" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "id": "59294dac", - "metadata": {}, - "source": [ - "Now you might be wondering what happens if you have so much data that it doesn't fit into your RAM? That's where you want to make use of an external Vector Database made specifically for storing and retrieving embeddings. Fortunately, semantic kernel makes this easy thanks to an extensive list of available connectors. 
In the following section, we will connect to an existing Azure AI Search service that we will use as an external Vector Database to store and retrieve embeddings.\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "from semantic_kernel.connectors.memory.azure_cognitive_search import AzureCognitiveSearchMemoryStore\n", - "\n", - "azure_ai_search_api_key, azure_ai_search_url = sk.azure_aisearch_settings_from_dot_env()\n", - "\n", - "#text-embedding-ada-002 uses a 1536-dimensional embedding vector\n", - "kernel.register_memory_store(\n", - " memory_store=AzureCognitiveSearchMemoryStore(\n", - " vector_size=1536,\n", - " search_endpoint=azure_ai_search_url,\n", - " admin_key=azure_ai_search_api_key\n", - " )\n", - ")\n" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "The implementation of Semantic Kernel allows to easily swap memory store for another. Here, we will re-use the functions we initially created for `VolatileMemoryStore` with our new external Vector Store leveraging Azure AI Search" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "await populate_memory(kernel)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "We can see that our function created an \"About Me\" index and that our five pieces of information have been indexed (note that it can take a few minutes for the UI to reflect the document count and storage size)." - ] - }, - { - "attachments": { - "image.png": { - "image/png": "" - } - }, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "![image.png](attachment:image.png)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "And we can see that embeddings have been conveniently created to allow for semantic search." 
- ] - }, - { - "attachments": { - "image.png": { - "image/png": "" - } - }, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "![image.png](attachment:image.png)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Let's now try to query from Azure AI Search!" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "await search_memory_examples(kernel)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "We have laid the foundation which will allow us to store an arbitrary amount of data in an external Vector Store above and beyond what could fit in memory at the expense of a little more latency." - ] + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "id": "68e1c158", + "metadata": {}, + "source": [ + "# Building Semantic Memory with Embeddings\n", + "\n", + "So far, we've mostly been treating the kernel as a stateless orchestration engine.\n", + "We send text into a model API and receive text out. \n", + "\n", + "In a [previous notebook](04-context-variables-chat.ipynb), we used `context variables` to pass in additional\n", + "text into prompts to enrich them with more context. This allowed us to create a basic chat experience. \n", + "\n", + "However, if you solely relied on context variables, you would quickly realize that eventually your prompt\n", + "would grow so large that you would run into the model's token limit. What we need is a way to persist state\n", + "and build both short-term and long-term memory to empower even more intelligent applications. \n", + "\n", + "To do this, we dive into the key concept of `Semantic Memory` in the Semantic Kernel. 
" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a77bdf89", + "metadata": {}, + "outputs": [], + "source": [ + "!python -m pip install semantic-kernel==0.4.4.dev0" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "508ad44f", + "metadata": {}, + "outputs": [], + "source": [ + "from typing import Tuple\n", + "\n", + "import semantic_kernel as sk\n", + "from semantic_kernel.connectors.ai.open_ai import (\n", + " OpenAIChatCompletion,\n", + " OpenAITextEmbedding,\n", + " AzureChatCompletion,\n", + " AzureTextEmbedding,\n", + ")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "d8ddffc1", + "metadata": {}, + "source": [ + "In order to use memory, we need to instantiate the Kernel with a Memory Storage\n", + "and an Embedding service. In this example, we make use of the `VolatileMemoryStore` which can be thought of as a temporary in-memory storage. This memory is not written to disk and is only available during the app session.\n", + "\n", + "When developing your app you will have the option to plug in persistent storage like Azure AI Search, Azure Cosmos Db, PostgreSQL, SQLite, etc. Semantic Memory allows also to index external data sources, without duplicating all the information as you will see further down in this notebook." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8f8dcbc6", + "metadata": {}, + "outputs": [], + "source": [ + "kernel = sk.Kernel()\n", + "\n", + "useAzureOpenAI = False\n", + "\n", + "# Configure AI service used by the kernel\n", + "if useAzureOpenAI:\n", + " deployment, api_key, endpoint = sk.azure_openai_settings_from_dot_env()\n", + " # next line assumes chat deployment name is \"turbo\", adjust the deployment name to the value of your chat model if needed\n", + " azure_chat_service = AzureChatCompletion(deployment_name=\"turbo\", endpoint=endpoint, api_key=api_key)\n", + " # next line assumes embeddings deployment name is \"text-embedding\", adjust the deployment name to the value of your embedding model if needed\n", + " azure_text_embedding = AzureTextEmbedding(deployment_name=\"text-embedding\", endpoint=endpoint, api_key=api_key)\n", + " kernel.add_chat_service(\"chat_completion\", azure_chat_service)\n", + " kernel.add_text_embedding_generation_service(\"ada\", azure_text_embedding)\n", + "else:\n", + " api_key, org_id = sk.openai_settings_from_dot_env()\n", + " oai_chat_service = OpenAIChatCompletion(ai_model_id=\"gpt-3.5-turbo\", api_key=api_key, org_id=org_id)\n", + " oai_text_embedding = OpenAITextEmbedding(ai_model_id=\"text-embedding-ada-002\", api_key=api_key, org_id=org_id)\n", + " kernel.add_chat_service(\"chat-gpt\", oai_chat_service)\n", + " kernel.add_text_embedding_generation_service(\"ada\", oai_text_embedding)\n", + "\n", + "kernel.register_memory_store(memory_store=sk.memory.VolatileMemoryStore())\n", + "kernel.import_skill(sk.core_skills.TextMemorySkill())" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "e7fefb6a", + "metadata": {}, + "source": [ + "At its core, Semantic Memory is a set of data structures that allow you to store the meaning of text that comes from different data sources, and optionally to store the source text too. 
These texts can be from the web, e-mail providers, chats, a database, or from your local directory, and are hooked up to the Semantic Kernel through data source connectors.\n", + "\n", + "The texts are embedded or compressed into a vector of floats that mathematically represents the texts' contents and meaning. You can read more about embeddings [here](https://aka.ms/sk/embeddings)." + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "2a7e7ca4", + "metadata": {}, + "source": [ + "### Manually adding memories\n", + "Let's create some initial memories \"About Me\". We can add memories to our `VolatileMemoryStore` by using `save_information_async`." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d096504c", + "metadata": {}, + "outputs": [], + "source": [ + "async def populate_memory(kernel: sk.Kernel) -> None:\n", + " # Add some documents to the semantic memory\n", + " await kernel.memory.save_information_async(collection=\"aboutMe\", id=\"info1\", text=\"My name is Andrea\")\n", + " await kernel.memory.save_information_async(\n", + " collection=\"aboutMe\", id=\"info2\", text=\"I currently work as a tour guide\"\n", + " )\n", + " await kernel.memory.save_information_async(\n", + " collection=\"aboutMe\", id=\"info3\", text=\"I've been living in Seattle since 2005\"\n", + " )\n", + " await kernel.memory.save_information_async(\n", + " collection=\"aboutMe\",\n", + " id=\"info4\",\n", + " text=\"I visited France and Italy five times since 2015\",\n", + " )\n", + " await kernel.memory.save_information_async(collection=\"aboutMe\", id=\"info5\", text=\"My family is from New York\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "await populate_memory(kernel)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "2calf857", + "metadata": {}, + "source": [ + "Let's try searching the memory:" + ] + }, + { + "cell_type": "code", + "execution_count": null, 
+ "id": "628c843e", + "metadata": {}, + "outputs": [], + "source": [ + "async def search_memory_examples(kernel: sk.Kernel) -> None:\n", + " questions = [\n", + " \"what's my name\",\n", + " \"where do I live?\",\n", + " \"where's my family from?\",\n", + " \"where have I traveled?\",\n", + " \"what do I do for work\",\n", + " ]\n", + "\n", + " for question in questions:\n", + " print(f\"Question: {question}\")\n", + " result = await kernel.memory.search_async(\"aboutMe\", question)\n", + " print(f\"Answer: {result[0].text}\\n\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "await search_memory_examples(kernel)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "e70c2b22", + "metadata": {}, + "source": [ + "Let's now revisit our chat sample from the [previous notebook](04-context-variables-chat.ipynb).\n", + "If you remember, we used context variables to fill the prompt with a `history` that continuously got populated as we chatted with the bot. Let's also add memory to it!" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "1ed54a32", + "metadata": {}, + "source": [ + "This is done by using the `TextMemorySkill` which exposes the `recall` native function.\n", + "\n", + "`recall` takes an input ask and performs a similarity search on the contents that have\n", + "been embedded in the Memory Store and returns the most relevant memory. 
" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "fb8549b2", + "metadata": {}, + "outputs": [], + "source": [ + "async def setup_chat_with_memory(\n", + " kernel: sk.Kernel,\n", + ") -> Tuple[sk.SKFunctionBase, sk.SKContext]:\n", + " sk_prompt = \"\"\"\n", + " ChatBot can have a conversation with you about any topic.\n", + " It can give explicit instructions or say 'I don't know' if\n", + " it does not have an answer.\n", + "\n", + " Information about me, from previous conversations:\n", + " - {{$fact1}} {{recall $fact1}}\n", + " - {{$fact2}} {{recall $fact2}}\n", + " - {{$fact3}} {{recall $fact3}}\n", + " - {{$fact4}} {{recall $fact4}}\n", + " - {{$fact5}} {{recall $fact5}}\n", + "\n", + " Chat:\n", + " {{$chat_history}}\n", + " User: {{$user_input}}\n", + " ChatBot: \"\"\".strip()\n", + "\n", + " chat_func = kernel.create_semantic_function(sk_prompt, max_tokens=200, temperature=0.8)\n", + "\n", + " context = kernel.create_new_context()\n", + " context[\"fact1\"] = \"what is my name?\"\n", + " context[\"fact2\"] = \"where do I live?\"\n", + " context[\"fact3\"] = \"where's my family from?\"\n", + " context[\"fact4\"] = \"where have I traveled?\"\n", + " context[\"fact5\"] = \"what do I do for work?\"\n", + "\n", + " context[sk.core_skills.TextMemorySkill.COLLECTION_PARAM] = \"aboutMe\"\n", + " context[sk.core_skills.TextMemorySkill.RELEVANCE_PARAM] = \"0.8\"\n", + "\n", + " context[\"chat_history\"] = \"\"\n", + "\n", + " return chat_func, context" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "1ac62457", + "metadata": {}, + "source": [ + "The `RelevanceParam` is used in memory search and is a measure of the relevance score from 0.0 to 1.0, where 1.0 means a perfect match. We encourage users to experiment with different values." + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "645b55a1", + "metadata": {}, + "source": [ + "Now that we've included our memories, let's chat!" 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "75267a2f", + "metadata": {}, + "outputs": [], + "source": [ + "async def chat(kernel: sk.Kernel, chat_func: sk.SKFunctionBase, context: sk.SKContext) -> bool:\n", + " try:\n", + " user_input = input(\"User:> \")\n", + " context[\"user_input\"] = user_input\n", + " print(f\"User:> {user_input}\")\n", + " except KeyboardInterrupt:\n", + " print(\"\\n\\nExiting chat...\")\n", + " return False\n", + " except EOFError:\n", + " print(\"\\n\\nExiting chat...\")\n", + " return False\n", + "\n", + " if user_input == \"exit\":\n", + " print(\"\\n\\nExiting chat...\")\n", + " return False\n", + "\n", + " answer = await kernel.run_async(chat_func, input_vars=context.variables)\n", + " context[\"chat_history\"] += f\"\\nUser:> {user_input}\\nChatBot:> {answer}\\n\"\n", + "\n", + " print(f\"ChatBot:> {answer}\")\n", + " return True" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e3875a34", + "metadata": {}, + "outputs": [], + "source": [ + "print(\"Populating memory...\")\n", + "await populate_memory(kernel)\n", + "\n", + "print(\"Asking questions... (manually)\")\n", + "await search_memory_examples(kernel)\n", + "\n", + "print(\"Setting up a chat (with memory!)\")\n", + "chat_func, context = await setup_chat_with_memory(kernel)\n", + "\n", + "print(\"Begin chatting (type 'exit' to exit):\\n\")\n", + "chatting = True\n", + "while chatting:\n", + " chatting = await chat(kernel, chat_func, context)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "0a51542b", + "metadata": {}, + "source": [ + "### Adding documents to your memory\n", + "\n", + "Many times in your applications you'll want to bring in external documents into your memory. Let's see how we can do this using our VolatileMemoryStore.\n", + "\n", + "Let's first get some data using some of the links in the Semantic Kernel repo." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "c3d5a1b9", + "metadata": {}, + "outputs": [], + "source": [ + "github_files = {}\n", + "github_files[\n", + " \"https://github.com/microsoft/semantic-kernel/blob/main/README.md\"\n", + "] = \"README: Installation, getting started, and how to contribute\"\n", + "github_files[\n", + " \"https://github.com/microsoft/semantic-kernel/blob/main/dotnet/notebooks/02-running-prompts-from-file.ipynb\"\n", + "] = \"Jupyter notebook describing how to pass prompts from a file to a semantic skill or function\"\n", + "github_files[\n", + " \"https://github.com/microsoft/semantic-kernel/blob/main/dotnet/notebooks/00-getting-started.ipynb\"\n", + "] = \"Jupyter notebook describing how to get started with the Semantic Kernel\"\n", + "github_files[\n", + " \"https://github.com/microsoft/semantic-kernel/tree/main/samples/skills/ChatSkill/ChatGPT\"\n", + "] = \"Sample demonstrating how to create a chat skill interfacing with ChatGPT\"\n", + "github_files[\n", + " \"https://github.com/microsoft/semantic-kernel/blob/main/dotnet/src/SemanticKernel/Memory/Volatile/VolatileMemoryStore.cs\"\n", + "] = \"C# class that defines a volatile embedding store\"" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "75f3ea5e", + "metadata": {}, + "source": [ + "Now let's add these files to our VolatileMemoryStore using `SaveReferenceAsync`. We'll separate these memories from the chat memories by putting them in a different collection." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "170e7142", + "metadata": {}, + "outputs": [], + "source": [ + "memory_collection_name = \"SKGitHub\"\n", + "print(\"Adding some GitHub file URLs and their descriptions to a volatile Semantic Memory.\")\n", + "i = 0\n", + "for entry, value in github_files.items():\n", + " await kernel.memory.save_reference_async(\n", + " collection=memory_collection_name,\n", + " description=value,\n", + " text=value,\n", + " external_id=entry,\n", + " external_source_name=\"GitHub\",\n", + " )\n", + " i += 1\n", + " print(\" URL {} saved\".format(i))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "143911c3", + "metadata": {}, + "outputs": [], + "source": [ + "ask = \"I love Jupyter notebooks, how should I get started?\"\n", + "print(\"===========================\\n\" + \"Query: \" + ask + \"\\n\")\n", + "\n", + "memories = await kernel.memory.search_async(memory_collection_name, ask, limit=5, min_relevance_score=0.77)\n", + "\n", + "i = 0\n", + "for memory in memories:\n", + " i += 1\n", + " print(f\"Result {i}:\")\n", + " print(\" URL: : \" + memory.id)\n", + " print(\" Title : \" + memory.description)\n", + " print(\" Relevance: \" + str(memory.relevance))\n", + " print()" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "59294dac", + "metadata": {}, + "source": [ + "Now you might be wondering what happens if you have so much data that it doesn't fit into your RAM? That's where you want to make use of an external Vector Database made specifically for storing and retrieving embeddings. Fortunately, semantic kernel makes this easy thanks to an extensive list of available connectors. 
In the following section, we will connect to an existing Azure AI Search service that we will use as an external Vector Database to store and retrieve embeddings.\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from semantic_kernel.connectors.memory.azure_cognitive_search import (\n", + " AzureCognitiveSearchMemoryStore,\n", + ")\n", + "\n", + "azure_ai_search_api_key, azure_ai_search_url = sk.azure_aisearch_settings_from_dot_env()\n", + "\n", + "# text-embedding-ada-002 uses a 1536-dimensional embedding vector\n", + "kernel.register_memory_store(\n", + " memory_store=AzureCognitiveSearchMemoryStore(\n", + " vector_size=1536,\n", + " search_endpoint=azure_ai_search_url,\n", + " admin_key=azure_ai_search_api_key,\n", + " )\n", + ")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The implementation of Semantic Kernel allows to easily swap memory store for another. Here, we will re-use the functions we initially created for `VolatileMemoryStore` with our new external Vector Store leveraging Azure AI Search" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "await populate_memory(kernel)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We can see that our function created an \"About Me\" index and that our five pieces of information have been indexed (note that it can take a few minutes for the UI to reflect the document count and storage size)." 
+ ] + }, + { + "attachments": { + "image.png": { + "image/png": "" } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.10.12" + }, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "![image.png](attachment:image.png)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "And we can see that embeddings have been conveniently created to allow for semantic search." + ] + }, + { + "attachments": { + "image.png": { + "image/png": "" } + }, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "![image.png](attachment:image.png)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Let's now try to query from Azure AI Search!" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "await search_memory_examples(kernel)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We have laid the foundation which will allow us to store an arbitrary amount of data in an external Vector Store above and beyond what could fit in memory at the expense of a little more latency." 
+ ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" }, - "nbformat": 4, - "nbformat_minor": 5 + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 } diff --git a/python/notebooks/07-hugging-face-for-skills.ipynb b/python/notebooks/07-hugging-face-for-skills.ipynb index d49f171b583e..c4ce3fb2d49a 100644 --- a/python/notebooks/07-hugging-face-for-skills.ipynb +++ b/python/notebooks/07-hugging-face-for-skills.ipynb @@ -20,7 +20,7 @@ "metadata": {}, "outputs": [], "source": [ - "!python -m pip install semantic-kernel==0.4.3.dev0\n", + "!python -m pip install semantic-kernel==0.4.4.dev0\n", "\n", "# Note that additional dependencies are required for the Hugging Face connectors:\n", "!python -m pip install torch==2.0.0\n", @@ -184,7 +184,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.6" + "version": "3.10.12" } }, "nbformat": 4, diff --git a/python/notebooks/08-native-function-inline.ipynb b/python/notebooks/08-native-function-inline.ipynb index ced7bd6f9317..588cde44659a 100644 --- a/python/notebooks/08-native-function-inline.ipynb +++ b/python/notebooks/08-native-function-inline.ipynb @@ -46,7 +46,7 @@ "metadata": {}, "outputs": [], "source": [ - "!python -m pip install semantic-kernel==0.4.3.dev0" + "!python -m pip install semantic-kernel==0.4.4.dev0" ] }, { @@ -576,7 +576,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.6" + "version": "3.10.12" } }, "nbformat": 4, diff --git a/python/notebooks/09-groundedness-checking.ipynb b/python/notebooks/09-groundedness-checking.ipynb index 30a0c6ca80f0..cf9cbeed18c2 100644 --- 
a/python/notebooks/09-groundedness-checking.ipynb +++ b/python/notebooks/09-groundedness-checking.ipynb @@ -81,7 +81,7 @@ "metadata": {}, "outputs": [], "source": [ - "!python -m pip install semantic-kernel==0.4.3.dev0" + "!python -m pip install semantic-kernel==0.4.4.dev0" ] }, { @@ -352,7 +352,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.3" + "version": "3.10.12" } }, "nbformat": 4, diff --git a/python/notebooks/10-multiple-results-per-prompt.ipynb b/python/notebooks/10-multiple-results-per-prompt.ipynb index 082078b62cc2..5ad8b068e24e 100644 --- a/python/notebooks/10-multiple-results-per-prompt.ipynb +++ b/python/notebooks/10-multiple-results-per-prompt.ipynb @@ -25,7 +25,7 @@ "metadata": {}, "outputs": [], "source": [ - "!python -m pip install semantic-kernel==0.4.3.dev0" + "!python -m pip install semantic-kernel==0.4.4.dev0" ] }, { @@ -36,7 +36,13 @@ "outputs": [], "source": [ "import semantic_kernel as sk\n", - "from semantic_kernel.connectors.ai import ChatRequestSettings, CompleteRequestSettings\n", + "from semantic_kernel.connectors.ai.open_ai.request_settings.open_ai_request_settings import (\n", + " OpenAITextRequestSettings,\n", + " OpenAIChatRequestSettings,\n", + ")\n", + "from semantic_kernel.connectors.ai.open_ai.request_settings.azure_chat_request_settings import (\n", + " AzureChatRequestSettings\n", + ")\n", "from semantic_kernel.connectors.ai.open_ai import AzureTextCompletion, AzureChatCompletion, OpenAITextCompletion, OpenAIChatCompletion\n", "from semantic_kernel.connectors.ai.hugging_face import HuggingFaceTextCompletion" ] @@ -61,9 +67,8 @@ "\n", "# Configure Azure LLM service\n", "deployment, api_key, endpoint = sk.azure_openai_settings_from_dot_env()\n", - "azure_text_service = AzureTextCompletion(deployment_name=\"text\", endpoint=endpoint, api_key=api_key) # set the deployment name to the value of your text model\n", - "azure_chat_service = 
AzureChatCompletion(deployment_name=\"turbo\", endpoint=endpoint, api_key=api_key) # set the deployment name to the value of your chat model\n", - "\n", + "azure_text_service = AzureTextCompletion(deployment_name=\"text-davinci-003\", endpoint=endpoint, api_key=api_key) # set the deployment name to the value of your text model\n", + "azure_chat_service = AzureChatCompletion(deployment_name=\"gpt-35-turbo\", endpoint=endpoint, api_key=api_key) # set the deployment name to the value of your chat model\n", "\n", "# Configure OpenAI service\n", "api_key, org_id = sk.openai_settings_from_dot_env()\n", @@ -90,14 +95,7 @@ "metadata": {}, "outputs": [], "source": [ - "request_settings = CompleteRequestSettings(\n", - " max_tokens=80,\n", - " temperature=0.7,\n", - " top_p=1,\n", - " frequency_penalty=0.5,\n", - " presence_penalty=0.5,\n", - " number_of_responses=3\n", - ")" + "oai_text_request_settings = OpenAITextRequestSettings(extension_data = { \"max_tokens\": 80, \"temperature\": 0.7, \"top_p\": 1, \"frequency_penalty\": 0.5, \"presence_penalty\": 0.5, \"number_of_responses\": 3})" ] }, { @@ -117,7 +115,7 @@ "outputs": [], "source": [ "prompt = \"what is the purpose of a rubber duck?\"\n", - "results = await oai_text_service.complete_async(prompt=prompt, settings=request_settings)\n", + "results = await oai_text_service.complete_async(prompt=prompt, settings=oai_text_request_settings)\n", "i = 1\n", "for result in results:\n", " print(f\"Result {i}: {result}\")\n", @@ -141,7 +139,7 @@ "outputs": [], "source": [ "prompt = \"provide me a list of possible meanings for the acronym 'ORLD'\"\n", - "results = await azure_text_service.complete_async(prompt=prompt, settings=request_settings)\n", + "results = await azure_text_service.complete_async(prompt=prompt, settings=oai_text_request_settings)\n", "i = 1\n", "for result in results:\n", " print(f\"Result {i}: {result}\")\n", @@ -157,6 +155,20 @@ "## Multiple Hugging Face Text Completions" ] }, + { + "cell_type": "code", + 
"execution_count": null, + "id": "4a148709", + "metadata": {}, + "outputs": [], + "source": [ + "from semantic_kernel.connectors.ai.hugging_face.hf_request_settings import (\n", + " HuggingFaceRequestSettings,\n", + ")\n", + "\n", + "hf_request_settings = HuggingFaceRequestSettings(extension_data = { \"max_new_tokens\": 80, \"temperature\": 0.7, \"top_p\": 1})" + ] + }, { "cell_type": "code", "execution_count": null, @@ -165,11 +177,8 @@ "outputs": [], "source": [ "prompt = \"The purpose of a rubber duck is\"\n", - "results = await hf_text_service.complete_async(prompt=prompt, request_settings=request_settings)\n", - "i = 1\n", - "for result in results:\n", - " print(f\"Result {i}: {result}\")\n", - " i += 1" + "results = await hf_text_service.complete_async(prompt=prompt, request_settings=hf_request_settings)\n", + "print(\"\".join(results))" ] }, { @@ -188,7 +197,7 @@ "metadata": {}, "outputs": [], "source": [ - "chat_request_settings = ChatRequestSettings(\n", + "oai_chat_request_settings = OpenAIChatRequestSettings(\n", " max_tokens=80,\n", " temperature=0.7,\n", " top_p=1,\n", @@ -217,10 +226,10 @@ "role = \"user\"\n", "content = \"It's a beautiful day outside, birds are singing, flowers are blooming. 
On days like these, kids like you...\"\n", "message = { \"role\":role, \"content\":content }\n", - "results = await oai_chat_service.complete_chat_async(messages=[message], settings=chat_request_settings)\n", + "results = await oai_chat_service.complete_chat_async(messages=[message], settings=oai_chat_request_settings)\n", "i = 0\n", "for result in results:\n", - " print(f\"Result {i}: {result}\")\n", + " print(f\"Result {i}: {result[0]}\")\n", " i += 1" ] }, @@ -233,6 +242,23 @@ "## Multiple Azure OpenAI Chat Completions" ] }, + { + "cell_type": "code", + "execution_count": null, + "id": "66ba4767", + "metadata": {}, + "outputs": [], + "source": [ + "az_oai_request_settings = AzureChatRequestSettings(\n", + " max_tokens=80,\n", + " temperature=0.7,\n", + " top_p=1,\n", + " frequency_penalty=0.5,\n", + " presence_penalty=0.5,\n", + " number_of_responses=3\n", + ")" + ] + }, { "cell_type": "code", "execution_count": null, @@ -243,10 +269,10 @@ "role = \"user\"\n", "content = \"Tomorow is going to be a great day, I can feel it. 
I'm going to wake up early, go for a run, and then...\"\n", "message = { \"role\":role, \"content\":content }\n", - "results = await azure_chat_service.complete_chat_async(messages=[message], settings=chat_request_settings)\n", + "results = await azure_chat_service.complete_chat_async(messages=[message], settings=az_oai_request_settings)\n", "i = 0\n", "for result in results:\n", - " print(f\"Result {i}: {result}\")\n", + " print(f\"Result {i}: {result[0]}\")\n", " i += 1" ] }, @@ -270,24 +296,39 @@ "source": [ "import os\n", "from IPython.display import clear_output\n", + "import time\n", "\n", - "if os.name == \"nt\":\n", - " clear = \"cls\"\n", - "else:\n", - " clear = \"clear\"\n", + "# Determine the clear command based on OS\n", + "clear_command = \"cls\" if os.name == \"nt\" else \"clear\"\n", "\n", "prompt = \"what is the purpose of a rubber duck?\"\n", - "stream = oai_text_service.complete_stream_async(prompt=prompt, settings=request_settings)\n", - "texts = [\"\"] * request_settings.number_of_responses\n", + "stream = oai_text_service.complete_stream_async(prompt=prompt, settings=oai_text_request_settings)\n", + "number_of_responses = oai_text_request_settings.number_of_responses\n", + "texts = [\"\"] * number_of_responses\n", + "\n", + "last_clear_time = time.time()\n", + "clear_interval = 0.5 # seconds\n", + "\n", + "# Note: there are some quirks with displaying the output, which sometimes flashes and disappears.\n", + "# This could be influenced by a few factors specific to Jupyter notebooks and asynchronous processing.\n", + "# The following code attempts to buffer the results to avoid the output flashing on/off the screen.\n", + "\n", "async for results in stream:\n", - " i = 1\n", - " clear_output(wait=True)\n", - " for result in results:\n", - " texts[i - 1] += result\n", - " print(f\"Result {i}: {texts[i - 1]}\")\n", - " i += 1\n", + " current_time = time.time()\n", + "\n", + " # Update texts with new results\n", + " for idx, result in 
enumerate(results):\n", + " if idx < number_of_responses:\n", + " texts[idx] += result\n", + "\n", + " # Clear and display output at intervals\n", + " if current_time - last_clear_time > clear_interval:\n", + " clear_output(wait=True)\n", + " for idx, text in enumerate(texts):\n", + " print(f\"Result {idx + 1}: {text}\")\n", + " last_clear_time = current_time\n", "\n", - "print(\"----------------------------------------\")\n" + "print(\"----------------------------------------\")" ] } ], @@ -307,7 +348,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.6" + "version": "3.10.12" } }, "nbformat": 4, diff --git a/python/notebooks/11-streaming-completions.ipynb b/python/notebooks/11-streaming-completions.ipynb index 36cd540cba7e..3a9c409e1d08 100644 --- a/python/notebooks/11-streaming-completions.ipynb +++ b/python/notebooks/11-streaming-completions.ipynb @@ -16,7 +16,7 @@ "metadata": {}, "outputs": [], "source": [ - "!python -m pip install semantic-kernel==0.4.3.dev0" + "!python -m pip install semantic-kernel==0.4.4.dev0" ] }, { @@ -27,8 +27,19 @@ "outputs": [], "source": [ "import semantic_kernel as sk\n", - "from semantic_kernel.connectors.ai import ChatRequestSettings, CompleteRequestSettings\n", - "from semantic_kernel.connectors.ai.open_ai import AzureTextCompletion, AzureChatCompletion, OpenAITextCompletion, OpenAIChatCompletion\n", + "from semantic_kernel.connectors.ai.open_ai.request_settings.open_ai_request_settings import (\n", + " OpenAITextRequestSettings,\n", + " OpenAIChatRequestSettings,\n", + ")\n", + "from semantic_kernel.connectors.ai.open_ai.request_settings.azure_chat_request_settings import (\n", + " AzureChatRequestSettings,\n", + ")\n", + "from semantic_kernel.connectors.ai.open_ai import (\n", + " AzureTextCompletion,\n", + " AzureChatCompletion,\n", + " OpenAITextCompletion,\n", + " OpenAIChatCompletion,\n", + ")\n", "from semantic_kernel.connectors.ai.hugging_face import 
HuggingFaceTextCompletion" ] }, @@ -52,8 +63,12 @@ "\n", "# Configure Azure LLM service\n", "deployment, api_key, endpoint = sk.azure_openai_settings_from_dot_env()\n", - "azure_text_service = AzureTextCompletion(deployment_name=\"text\", endpoint=endpoint, api_key=api_key) # set the deployment name to the value of your text model\n", - "azure_chat_service = AzureChatCompletion(deployment_name=\"turbo\", endpoint=endpoint, api_key=api_key) # set the deployment name to the value of your chat model\n", + "azure_text_service = AzureTextCompletion(\n", + " deployment_name=\"text\", endpoint=endpoint, api_key=api_key\n", + ") # set the deployment name to the value of your text model\n", + "azure_chat_service = AzureChatCompletion(\n", + " deployment_name=\"turbo\", endpoint=endpoint, api_key=api_key\n", + ") # set the deployment name to the value of your chat model\n", "\n", "# Configure OpenAI service\n", "api_key, org_id = sk.openai_settings_from_dot_env()\n", @@ -80,12 +95,12 @@ "metadata": {}, "outputs": [], "source": [ - "request_settings = CompleteRequestSettings(\n", + "oai_request_settings = OpenAITextRequestSettings(\n", " max_tokens=150,\n", " temperature=0.7,\n", " top_p=1,\n", " frequency_penalty=0.5,\n", - " presence_penalty=0.5\n", + " presence_penalty=0.5,\n", ")" ] }, @@ -106,9 +121,9 @@ "outputs": [], "source": [ "prompt = \"what is the purpose of a rubber duck?\"\n", - "stream = oai_text_service.complete_stream_async(prompt=prompt, settings=request_settings)\n", + "stream = oai_text_service.complete_stream_async(prompt=prompt, settings=oai_request_settings)\n", "async for text in stream:\n", - " print(text, end = \"\") # end = \"\" to avoid newlines" + " print(text, end=\"\") # end = \"\" to avoid newlines" ] }, { @@ -128,9 +143,9 @@ "outputs": [], "source": [ "prompt = \"provide me a list of possible meanings for the acronym 'ORLD'\"\n", - "stream = azure_text_service.complete_stream_async(prompt=prompt, settings=request_settings)\n", + "stream = 
azure_text_service.complete_stream_async(prompt=prompt, settings=oai_request_settings)\n", "async for text in stream:\n", - " print(text, end = \"\") # end = \"\" to avoid newlines" + " print(text, end=\"\") # end = \"\" to avoid newlines" ] }, { @@ -142,6 +157,27 @@ "## Streaming Hugging Face Text Completion" ] }, + { + "cell_type": "code", + "execution_count": null, + "id": "be7b1c2e", + "metadata": {}, + "outputs": [], + "source": [ + "from semantic_kernel.connectors.ai.hugging_face.hf_request_settings import (\n", + " HuggingFaceRequestSettings,\n", + ")\n", + "\n", + "hf_request_settings = HuggingFaceRequestSettings(\n", + " extension_data={\n", + " \"max_new_tokens\": 80,\n", + " \"top_p\": 1,\n", + " \"eos_token_id\": 11,\n", + " \"pad_token_id\": 0,\n", + " }\n", + ")" + ] + }, { "cell_type": "code", "execution_count": null, @@ -150,9 +186,9 @@ "outputs": [], "source": [ "prompt = \"The purpose of a rubber duck is\"\n", - "stream = hf_text_service.complete_stream_async(prompt=prompt, request_settings=request_settings)\n", + "stream = hf_text_service.complete_stream_async(prompt=prompt, request_settings=hf_request_settings)\n", "async for text in stream:\n", - " print(text, end = \"\") # end = \"\" to avoid newlines" + " print(text, end=\"\") # end = \"\" to avoid newlines" ] }, { @@ -171,7 +207,7 @@ "metadata": {}, "outputs": [], "source": [ - "chat_request_settings = ChatRequestSettings(\n", + "oai_chat_request_settings = OpenAIChatRequestSettings(\n", " max_tokens=150,\n", " temperature=0.7,\n", " top_p=1,\n", @@ -198,10 +234,10 @@ "source": [ "role = \"system\"\n", "content = \"You are an AI assistant that helps people find information.\"\n", - "message = { \"role\":role, \"content\":content }\n", - "stream = oai_chat_service.complete_chat_stream_async(messages=[message], settings=chat_request_settings)\n", + "message = {\"role\": role, \"content\": content}\n", + "stream = oai_chat_service.complete_chat_stream_async(messages=[message], 
settings=oai_chat_request_settings)\n", "async for text in stream:\n", - " print(text, end = \"\") # end = \"\" to avoid newlines" + " print(text, end=\"\") # end = \"\" to avoid newlines" ] }, { @@ -213,6 +249,22 @@ "## Streaming Azure OpenAI Chat Completion" ] }, + { + "cell_type": "code", + "execution_count": null, + "id": "da1e9f59", + "metadata": {}, + "outputs": [], + "source": [ + "az_oai_chat_request_settings = AzureChatRequestSettings(\n", + " max_tokens=150,\n", + " temperature=0.7,\n", + " top_p=1,\n", + " frequency_penalty=0.5,\n", + " presence_penalty=0.5,\n", + ")" + ] + }, { "cell_type": "code", "execution_count": null, @@ -222,10 +274,10 @@ "source": [ "role = \"system\"\n", "content = \"You are an AI assistant that helps people find information.\"\n", - "message = { \"role\":role, \"content\":content }\n", - "stream = azure_chat_service.complete_chat_stream_async(messages=[message], settings=chat_request_settings)\n", + "message = {\"role\": role, \"content\": content}\n", + "stream = azure_chat_service.complete_chat_stream_async(messages=[message], settings=az_oai_chat_request_settings)\n", "async for text in stream:\n", - " print(text, end = \"\") # end = \"\" to avoid newlines" + " print(text, end=\"\") # end = \"\" to avoid newlines" ] } ], @@ -245,7 +297,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.6" + "version": "3.10.12" } }, "nbformat": 4, diff --git a/python/notebooks/third_party/weaviate-persistent-memory.ipynb b/python/notebooks/third_party/weaviate-persistent-memory.ipynb index 90ef285bb7c4..da708da4ddb0 100644 --- a/python/notebooks/third_party/weaviate-persistent-memory.ipynb +++ b/python/notebooks/third_party/weaviate-persistent-memory.ipynb @@ -1,530 +1,510 @@ { - "cells": [ - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Introduction" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "This notebook shows how to replace the 
`VolatileMemoryStore` memory storage used in a [previous notebook](./06-memory-and-embeddings.ipynb) with a `WeaviateMemoryStore`.\n", - "\n", - "`WeaviateMemoryStore` is an example of a persistent (i.e. long-term) memory store backed by the Weaviate vector database." - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# About Weaviate" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "[Weaviate](https://weaviate.io/) is an open-source vector database designed to scale seamlessly into billions of data objects. This implementation supports hybrid search out-of-the-box (meaning it will perform better for keyword searches)." - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "You can run Weaviate in 5 ways:\n", - "\n", - "- **SaaS** – with [Weaviate Cloud Services (WCS)](https://weaviate.io/pricing).\n", - "\n", - " WCS is a fully managed service that takes care of hosting, scaling, and updating your Weaviate instance. You can try it out for free with a sandbox that lasts for 14 days.\n", - "\n", - " To set up a SaaS Weaviate instance with WCS:\n", - "\n", - " 1. Navigate to [Weaviate Cloud Console](https://console.weaviate.cloud/).\n", - " 2. Register or sign in to your WCS account.\n", - " 3. Create a new cluster with the following settings:\n", - " - `Subscription Tier` – Free sandbox for a free trial, or contact [hello@weaviate.io](mailto:hello@weaviate.io) for other options.\n", - " - `Cluster name` – a unique name for your cluster. The name will become part of the URL used to access this instance.\n", - " - `Enable Authentication?` – Enabled by default. This will generate a static API key that you can use to authenticate.\n", - " 4. Wait for a few minutes until your cluster is ready. You will see a green tick ✔️ when it's done. 
Copy your cluster URL.\n", - "\n", - "- **Hybrid SaaS**\n", - "\n", - " > If you need to keep your data on-premise for security or compliance reasons, Weaviate also offers a Hybrid SaaS option: Weaviate runs within your cloud instances, but the cluster is managed remotely by Weaviate. This gives you the benefits of a managed service without sending data to an external party.\n", - "\n", - " The Weaviate Hybrid SaaS is a custom solution. If you are interested in this option, please reach out to [hello@weaviate.io](mailto:hello@weaviate.io).\n", - "\n", - "- **Self-hosted** – with a Docker container\n", - "\n", - " To set up a Weaviate instance with Docker:\n", - "\n", - " 1. [Install Docker](https://docs.docker.com/engine/install/) on your local machine if it is not already installed.\n", - " 2. [Install the Docker Compose Plugin](https://docs.docker.com/compose/install/)\n", - " 3. Download a `docker-compose.yml` file with this `curl` command:\n", - "\n", - " ```\n", - " curl -o docker-compose.yml \"https://configuration.weaviate.io/v2/docker-compose/docker-compose.yml?modules=standalone&runtime=docker-compose&weaviate_version=v1.19.6\"\n", - " ```\n", - "\n", - " Alternatively, you can use Weaviate's docker compose [configuration tool](https://weaviate.io/developers/weaviate/installation/docker-compose) to generate your own `docker-compose.yml` file.\n", - "\n", - " 4. 
Run `docker compose up -d` to spin up a Weaviate instance.\n", - "\n", - " > To shut it down, run `docker compose down`.\n", - "\n", - "- **Self-hosted** – with a Kubernetes cluster\n", - "\n", - " To configure a self-hosted instance with Kubernetes, follow Weaviate's [documentation](https://weaviate.io/developers/weaviate/installation/kubernetes).|\n", - "\n", - "- **Embedded** - start a weaviate instance right from your application code using the client library\n", - " \n", - " This code snippet shows how to instantiate an embedded weaviate instance and upload a document:\n", - "\n", - " ```python\n", - " import weaviate\n", - " from weaviate.embedded import EmbeddedOptions\n", - "\n", - " client = weaviate.Client(\n", - " embedded_options=EmbeddedOptions()\n", - " )\n", - "\n", - " data_obj = {\n", - " \"name\": \"Chardonnay\",\n", - " \"description\": \"Goes with fish\"\n", - " }\n", - "\n", - " client.data_object.create(data_obj, \"Wine\")\n", - " ```\n", - " \n", - " Refer to the [documentation](https://weaviate.io/developers/weaviate/installation/embedded) for more details about this deployment method." 
- ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Setup" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "!pip install semantic-kernel==0.3.8.dev0\n", - "!pip install weaviate-client\n", - "!pip install python-dotenv" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## OS-specific notes:\n", - "* if you run into SSL errors when connecting to OpenAI on macOS, see this issue for a [potential solution](https://github.com/microsoft/semantic-kernel/issues/627#issuecomment-1580912248)\n", - "* on Windows, you may need to run Docker Desktop as administrator" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "from typing import Tuple\n", - "\n", - "import semantic_kernel as sk\n", - "from semantic_kernel.connectors.ai.open_ai import (\n", - " OpenAIChatCompletion,\n", - " OpenAITextEmbedding,\n", - ")\n", - "\n", - "import os" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "First, we instantiate the Weaviate memory store. Uncomment ONE of the options below, depending on how you want to use Weaviate:\n", - "* from a Docker instance\n", - "* from WCS\n", - "* directly from the client (embedded Weaviate), which works on Linux only at the moment" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "from semantic_kernel.connectors.memory.weaviate import weaviate_memory_store\n", - "from dotenv import load_dotenv\n", - "\n", - "load_dotenv(override=True)\n", - "\n", - "# Using Docker\n", - "config = weaviate_memory_store.WeaviateConfig(url=\"http://localhost:8080\")\n", - "\n", - "# Using WCS. 
Make sure the environment variables `WEAVIATE_URL` and `WEAVIATE_API_KEY`\n", - "# were set in the `.env` file.\n", - "#\n", - "#weaviate_api, weaviate_url = sk.weaviate_settings_from_dot_env()\n", - "#\n", - "#config = weaviate_memory_store.WeaviateConfig(\n", - "# url=weaviate_url,\n", - "# api_key=weaviate_api\n", - "#)\n", - "\n", - "# Using Embedded Weaviate\n", - "#config = weaviate_memory_store.WeaviateConfig(use_embed=True)\n", - "\n", - "store = weaviate_memory_store.WeaviateMemoryStore(config=config)\n", - "store.client.schema.delete_all()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Then, we register the memory store to the kernel:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "kernel = sk.Kernel()\n", - "\n", - "api_key, org_id = sk.openai_settings_from_dot_env()\n", - "kernel.add_chat_service(\n", - " \"chat-gpt\", OpenAIChatCompletion(\"gpt-3.5-turbo\", api_key, org_id)\n", - ")\n", - "kernel.add_text_embedding_generation_service(\n", - " \"ada\", OpenAITextEmbedding(\"text-embedding-ada-002\", api_key, org_id)\n", - ")\n", - "\n", - "kernel.register_memory_store(memory_store=store)\n", - "kernel.import_skill(sk.core_skills.TextMemorySkill())" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Manually adding memories\n" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Let's create some initial memories \"About Me\". 
We can add memories to our weaviate memory store by using `save_information_async`" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "COLLECTION = \"AboutMe\"" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "async def populate_memory(kernel: sk.Kernel) -> None:\n", - " # Add some documents to the semantic memory\n", - " await kernel.memory.save_information_async(\n", - " COLLECTION, id=\"info1\", text=\"My name is Andrea\"\n", - " )\n", - " await kernel.memory.save_information_async(\n", - " COLLECTION, id=\"info2\", text=\"I currently work as a tour guide\"\n", - " )\n", - " await kernel.memory.save_information_async(\n", - " COLLECTION, id=\"info3\", text=\"I've been living in Seattle since 2005\"\n", - " )\n", - " await kernel.memory.save_information_async(\n", - " COLLECTION, id=\"info4\", text=\"I visited France and Italy five times since 2015\"\n", - " )\n", - " await kernel.memory.save_information_async(\n", - " COLLECTION, id=\"info5\", text=\"My family is from New York\"\n", - " )" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Searching is done through `search_async`:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "async def search_memory_examples(kernel: sk.Kernel) -> None:\n", - " questions = [\n", - " \"what's my name\",\n", - " \"where do I live?\",\n", - " \"where's my family from?\",\n", - " \"where have I traveled?\",\n", - " \"what do I do for work\",\n", - " ]\n", - "\n", - " for question in questions:\n", - " print(f\"Question: {question}\")\n", - " result = await kernel.memory.search_async(COLLECTION, question)\n", - " print(f\"Answer: {result[0].text}\\n\")" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Let's see the results of the functions:" - ] - }, - { - "cell_type": "code", - 
"execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "print(\"Populating memory...\")\n", - "await populate_memory(kernel)\n", - "\n", - "print(\"Asking questions... (manually)\")\n", - "await search_memory_examples(kernel)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Here's how to use the weaviate memory store in a chat application:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "async def setup_chat_with_memory(\n", - " kernel: sk.Kernel,\n", - ") -> Tuple[sk.SKFunctionBase, sk.SKContext]:\n", - " sk_prompt = \"\"\"\n", - " ChatBot can have a conversation with you about any topic.\n", - " It can give explicit instructions or say 'I don't know' if\n", - " it does not have an answer.\n", - "\n", - " Information about me, from previous conversations:\n", - " - {{$fact1}} {{recall $fact1}}\n", - " - {{$fact2}} {{recall $fact2}}\n", - " - {{$fact3}} {{recall $fact3}}\n", - " - {{$fact4}} {{recall $fact4}}\n", - " - {{$fact5}} {{recall $fact5}}\n", - "\n", - " Chat:\n", - " {{$chat_history}}\n", - " User: {{$user_input}}\n", - " ChatBot: \"\"\".strip()\n", - "\n", - " chat_func = kernel.create_semantic_function(\n", - " sk_prompt, max_tokens=200, temperature=0.8\n", - " )\n", - "\n", - " context = kernel.create_new_context()\n", - " context[\"fact1\"] = \"what is my name?\"\n", - " context[\"fact2\"] = \"where do I live?\"\n", - " context[\"fact3\"] = \"where's my family from?\"\n", - " context[\"fact4\"] = \"where have I traveled?\"\n", - " context[\"fact5\"] = \"what do I do for work?\"\n", - "\n", - " context[sk.core_skills.TextMemorySkill.COLLECTION_PARAM] = COLLECTION\n", - " context[sk.core_skills.TextMemorySkill.RELEVANCE_PARAM] = 0.8\n", - "\n", - " context[\"chat_history\"] = \"\"\n", - "\n", - " return chat_func, context" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - 
"async def chat(\n", - " kernel: sk.Kernel, chat_func: sk.SKFunctionBase, context: sk.SKContext\n", - ") -> bool:\n", - " try:\n", - " user_input = input(\"User:> \")\n", - " context[\"user_input\"] = user_input\n", - " except KeyboardInterrupt:\n", - " print(\"\\n\\nExiting chat...\")\n", - " return False\n", - " except EOFError:\n", - " print(\"\\n\\nExiting chat...\")\n", - " return False\n", - "\n", - " if user_input == \"exit\":\n", - " print(\"\\n\\nExiting chat...\")\n", - " return False\n", - "\n", - " answer = await kernel.run_async(chat_func, input_vars=context.variables)\n", - " context[\"chat_history\"] += f\"\\nUser:> {user_input}\\nChatBot:> {answer}\\n\"\n", - "\n", - " print(f\"ChatBot:> {answer}\")\n", - " return True" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "print(\"Setting up a chat (with memory!)\")\n", - "chat_func, context = await setup_chat_with_memory(kernel)\n", - "\n", - "print(\"Begin chatting (type 'exit' to exit):\\n\")\n", - "chatting = True\n", - "while chatting:\n", - " chatting = await chat(kernel, chat_func, context)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Adding documents to your memory" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Create a dictionary to hold some files. 
The key is the hyperlink to the file and the value is the file's content:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "github_files = {}\n", - "github_files[\n", - " \"https://github.com/microsoft/semantic-kernel/blob/main/README.md\"\n", - "] = \"README: Installation, getting started, and how to contribute\"\n", - "github_files[\n", - " \"https://github.com/microsoft/semantic-kernel/blob/main/dotnet/notebooks/02-running-prompts-from-file.ipynb\"\n", - "] = \"Jupyter notebook describing how to pass prompts from a file to a semantic skill or function\"\n", - "github_files[\n", - " \"https://github.com/microsoft/semantic-kernel/blob/main/dotnet/notebooks/00-getting-started.ipynb\"\n", - "] = \"Jupyter notebook describing how to get started with the Semantic Kernel\"\n", - "github_files[\n", - " \"https://github.com/microsoft/semantic-kernel/tree/main/samples/skills/ChatSkill/ChatGPT\"\n", - "] = \"Sample demonstrating how to create a chat skill interfacing with ChatGPT\"\n", - "github_files[\n", - " \"https://github.com/microsoft/semantic-kernel/blob/main/dotnet/src/SemanticKernel/Memory/Volatile/VolatileMemoryStore.cs\"\n", - "] = \"C# class that defines a volatile embedding store\"" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Use `save_reference_async` to save the file:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "COLLECTION = \"SKGitHub\"\n", - "\n", - "print(\n", - " \"Adding some GitHub file URLs and their descriptions to a volatile Semantic Memory.\"\n", - ")\n", - "i = 0\n", - "for entry, value in github_files.items():\n", - " await kernel.memory.save_reference_async(\n", - " collection=COLLECTION,\n", - " description=value,\n", - " text=value,\n", - " external_id=entry,\n", - " external_source_name=\"GitHub\",\n", - " )\n", - " i += 1\n", - " print(\" URL {} saved\".format(i))" - ] - }, - 
{ - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Use `search_async` to ask a question:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "ask = \"I love Jupyter notebooks, how should I get started?\"\n", - "print(\"===========================\\n\" + \"Query: \" + ask + \"\\n\")\n", - "\n", - "memories = await kernel.memory.search_async(\n", - " COLLECTION, ask, limit=5, min_relevance_score=0.77\n", - ")\n", - "\n", - "i = 0\n", - "for memory in memories:\n", - " i += 1\n", - " print(f\"Result {i}:\")\n", - " print(\" URL: : \" + memory.id)\n", - " print(\" Title : \" + memory.description)\n", - " print(\" Relevance: \" + str(memory.relevance))\n", - " print()" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.9.13" - } - }, - "nbformat": 4, - "nbformat_minor": 2 + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Introduction" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "This notebook shows how to replace the `VolatileMemoryStore` memory storage used in a [previous notebook](./06-memory-and-embeddings.ipynb) with a `WeaviateMemoryStore`.\n", + "\n", + "`WeaviateMemoryStore` is an example of a persistent (i.e. long-term) memory store backed by the Weaviate vector database." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# About Weaviate" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "[Weaviate](https://weaviate.io/) is an open-source vector database designed to scale seamlessly into billions of data objects. 
This implementation supports hybrid search out-of-the-box (meaning it will perform better for keyword searches)." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "You can run Weaviate in 5 ways:\n", + "\n", + "- **SaaS** – with [Weaviate Cloud Services (WCS)](https://weaviate.io/pricing).\n", + "\n", + " WCS is a fully managed service that takes care of hosting, scaling, and updating your Weaviate instance. You can try it out for free with a sandbox that lasts for 14 days.\n", + "\n", + " To set up a SaaS Weaviate instance with WCS:\n", + "\n", + " 1. Navigate to [Weaviate Cloud Console](https://console.weaviate.cloud/).\n", + " 2. Register or sign in to your WCS account.\n", + " 3. Create a new cluster with the following settings:\n", + " - `Subscription Tier` – Free sandbox for a free trial, or contact [hello@weaviate.io](mailto:hello@weaviate.io) for other options.\n", + " - `Cluster name` – a unique name for your cluster. The name will become part of the URL used to access this instance.\n", + " - `Enable Authentication?` – Enabled by default. This will generate a static API key that you can use to authenticate.\n", + " 4. Wait for a few minutes until your cluster is ready. You will see a green tick ✔️ when it's done. Copy your cluster URL.\n", + "\n", + "- **Hybrid SaaS**\n", + "\n", + " > If you need to keep your data on-premise for security or compliance reasons, Weaviate also offers a Hybrid SaaS option: Weaviate runs within your cloud instances, but the cluster is managed remotely by Weaviate. This gives you the benefits of a managed service without sending data to an external party.\n", + "\n", + " The Weaviate Hybrid SaaS is a custom solution. If you are interested in this option, please reach out to [hello@weaviate.io](mailto:hello@weaviate.io).\n", + "\n", + "- **Self-hosted** – with a Docker container\n", + "\n", + " To set up a Weaviate instance with Docker:\n", + "\n", + " 1. 
[Install Docker](https://docs.docker.com/engine/install/) on your local machine if it is not already installed.\n", + " 2. [Install the Docker Compose Plugin](https://docs.docker.com/compose/install/)\n", + " 3. Download a `docker-compose.yml` file with this `curl` command:\n", + "\n", + " ```\n", + " curl -o docker-compose.yml \"https://configuration.weaviate.io/v2/docker-compose/docker-compose.yml?modules=standalone&runtime=docker-compose&weaviate_version=v1.19.6\"\n", + " ```\n", + "\n", + " Alternatively, you can use Weaviate's docker compose [configuration tool](https://weaviate.io/developers/weaviate/installation/docker-compose) to generate your own `docker-compose.yml` file.\n", + "\n", + " 4. Run `docker compose up -d` to spin up a Weaviate instance.\n", + "\n", + " > To shut it down, run `docker compose down`.\n", + "\n", + "- **Self-hosted** – with a Kubernetes cluster\n", + "\n", + " To configure a self-hosted instance with Kubernetes, follow Weaviate's [documentation](https://weaviate.io/developers/weaviate/installation/kubernetes).\n", + "\n", + "- **Embedded** – start a Weaviate instance right from your application code using the client library\n", + " \n", + " This code snippet shows how to instantiate an embedded Weaviate instance and upload a document:\n", + "\n", + " ```python\n", + " import weaviate\n", + " from weaviate.embedded import EmbeddedOptions\n", + "\n", + " client = weaviate.Client(\n", + " embedded_options=EmbeddedOptions()\n", + " )\n", + "\n", + " data_obj = {\n", + " \"name\": \"Chardonnay\",\n", + " \"description\": \"Goes with fish\"\n", + " }\n", + "\n", + " client.data_object.create(data_obj, \"Wine\")\n", + " ```\n", + " \n", + " Refer to the [documentation](https://weaviate.io/developers/weaviate/installation/embedded) for more details about this deployment method." 
+ ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Setup" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "!pip install semantic-kernel==0.3.8.dev0\n", + "!pip install weaviate-client\n", + "!pip install python-dotenv" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## OS-specific notes:\n", + "* if you run into SSL errors when connecting to OpenAI on macOS, see this issue for a [potential solution](https://github.com/microsoft/semantic-kernel/issues/627#issuecomment-1580912248)\n", + "* on Windows, you may need to run Docker Desktop as administrator" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from typing import Tuple\n", + "\n", + "import semantic_kernel as sk\n", + "from semantic_kernel.connectors.ai.open_ai import (\n", + " OpenAIChatCompletion,\n", + " OpenAITextEmbedding,\n", + ")\n", + "\n", + "import os" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "First, we instantiate the Weaviate memory store. Uncomment ONE of the options below, depending on how you want to use Weaviate:\n", + "* from a Docker instance\n", + "* from WCS\n", + "* directly from the client (embedded Weaviate), which works on Linux only at the moment" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from semantic_kernel.connectors.memory.weaviate import weaviate_memory_store\n", + "from dotenv import load_dotenv\n", + "\n", + "load_dotenv(override=True)\n", + "\n", + "# Using Docker\n", + "config = weaviate_memory_store.WeaviateConfig(url=\"http://localhost:8080\")\n", + "\n", + "# Using WCS. 
Make sure the environment variables `WEAVIATE_URL` and `WEAVIATE_API_KEY`\n", + "# were set in the `.env` file.\n", + "#\n", + "# weaviate_api, weaviate_url = sk.weaviate_settings_from_dot_env()\n", + "#\n", + "# config = weaviate_memory_store.WeaviateConfig(\n", + "# url=weaviate_url,\n", + "# api_key=weaviate_api\n", + "# )\n", + "\n", + "# Using Embedded Weaviate\n", + "# config = weaviate_memory_store.WeaviateConfig(use_embed=True)\n", + "\n", + "store = weaviate_memory_store.WeaviateMemoryStore(config=config)\n", + "store.client.schema.delete_all()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Then, we register the memory store to the kernel:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "kernel = sk.Kernel()\n", + "\n", + "api_key, org_id = sk.openai_settings_from_dot_env()\n", + "kernel.add_chat_service(\"chat-gpt\", OpenAIChatCompletion(\"gpt-3.5-turbo\", api_key, org_id))\n", + "kernel.add_text_embedding_generation_service(\"ada\", OpenAITextEmbedding(\"text-embedding-ada-002\", api_key, org_id))\n", + "\n", + "kernel.register_memory_store(memory_store=store)\n", + "kernel.import_skill(sk.core_skills.TextMemorySkill())" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Manually adding memories\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Let's create some initial memories \"About Me\". 
We can add memories to our weaviate memory store by using `save_information_async`" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "COLLECTION = \"AboutMe\"" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "async def populate_memory(kernel: sk.Kernel) -> None:\n", + " # Add some documents to the semantic memory\n", + " await kernel.memory.save_information_async(COLLECTION, id=\"info1\", text=\"My name is Andrea\")\n", + " await kernel.memory.save_information_async(COLLECTION, id=\"info2\", text=\"I currently work as a tour guide\")\n", + " await kernel.memory.save_information_async(COLLECTION, id=\"info3\", text=\"I've been living in Seattle since 2005\")\n", + " await kernel.memory.save_information_async(\n", + " COLLECTION, id=\"info4\", text=\"I visited France and Italy five times since 2015\"\n", + " )\n", + " await kernel.memory.save_information_async(COLLECTION, id=\"info5\", text=\"My family is from New York\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Searching is done through `search_async`:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "async def search_memory_examples(kernel: sk.Kernel) -> None:\n", + " questions = [\n", + " \"what's my name\",\n", + " \"where do I live?\",\n", + " \"where's my family from?\",\n", + " \"where have I traveled?\",\n", + " \"what do I do for work\",\n", + " ]\n", + "\n", + " for question in questions:\n", + " print(f\"Question: {question}\")\n", + " result = await kernel.memory.search_async(COLLECTION, question)\n", + " print(f\"Answer: {result[0].text}\\n\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Let's see the results of the functions:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + 
"print(\"Populating memory...\")\n", + "await populate_memory(kernel)\n", + "\n", + "print(\"Asking questions... (manually)\")\n", + "await search_memory_examples(kernel)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Here's how to use the weaviate memory store in a chat application:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "async def setup_chat_with_memory(\n", + " kernel: sk.Kernel,\n", + ") -> Tuple[sk.SKFunctionBase, sk.SKContext]:\n", + " sk_prompt = \"\"\"\n", + " ChatBot can have a conversation with you about any topic.\n", + " It can give explicit instructions or say 'I don't know' if\n", + " it does not have an answer.\n", + "\n", + " Information about me, from previous conversations:\n", + " - {{$fact1}} {{recall $fact1}}\n", + " - {{$fact2}} {{recall $fact2}}\n", + " - {{$fact3}} {{recall $fact3}}\n", + " - {{$fact4}} {{recall $fact4}}\n", + " - {{$fact5}} {{recall $fact5}}\n", + "\n", + " Chat:\n", + " {{$chat_history}}\n", + " User: {{$user_input}}\n", + " ChatBot: \"\"\".strip()\n", + "\n", + " chat_func = kernel.create_semantic_function(sk_prompt, max_tokens=200, temperature=0.8)\n", + "\n", + " context = kernel.create_new_context()\n", + " context[\"fact1\"] = \"what is my name?\"\n", + " context[\"fact2\"] = \"where do I live?\"\n", + " context[\"fact3\"] = \"where's my family from?\"\n", + " context[\"fact4\"] = \"where have I traveled?\"\n", + " context[\"fact5\"] = \"what do I do for work?\"\n", + "\n", + " context[sk.core_skills.TextMemorySkill.COLLECTION_PARAM] = COLLECTION\n", + " context[sk.core_skills.TextMemorySkill.RELEVANCE_PARAM] = 0.8\n", + "\n", + " context[\"chat_history\"] = \"\"\n", + "\n", + " return chat_func, context" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "async def chat(kernel: sk.Kernel, chat_func: sk.SKFunctionBase, context: sk.SKContext) -> 
bool:\n", + " try:\n", + " user_input = input(\"User:> \")\n", + " context[\"user_input\"] = user_input\n", + " except KeyboardInterrupt:\n", + " print(\"\\n\\nExiting chat...\")\n", + " return False\n", + " except EOFError:\n", + " print(\"\\n\\nExiting chat...\")\n", + " return False\n", + "\n", + " if user_input == \"exit\":\n", + " print(\"\\n\\nExiting chat...\")\n", + " return False\n", + "\n", + " answer = await kernel.run_async(chat_func, input_vars=context.variables)\n", + " context[\"chat_history\"] += f\"\\nUser:> {user_input}\\nChatBot:> {answer}\\n\"\n", + "\n", + " print(f\"ChatBot:> {answer}\")\n", + " return True" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "print(\"Setting up a chat (with memory!)\")\n", + "chat_func, context = await setup_chat_with_memory(kernel)\n", + "\n", + "print(\"Begin chatting (type 'exit' to exit):\\n\")\n", + "chatting = True\n", + "while chatting:\n", + " chatting = await chat(kernel, chat_func, context)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Adding documents to your memory" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Create a dictionary to hold some files. 
The key is the hyperlink to the file and the value is the file's content:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "github_files = {}\n", + "github_files[\n", + " \"https://github.com/microsoft/semantic-kernel/blob/main/README.md\"\n", + "] = \"README: Installation, getting started, and how to contribute\"\n", + "github_files[\n", + " \"https://github.com/microsoft/semantic-kernel/blob/main/dotnet/notebooks/02-running-prompts-from-file.ipynb\"\n", + "] = \"Jupyter notebook describing how to pass prompts from a file to a semantic skill or function\"\n", + "github_files[\n", + " \"https://github.com/microsoft/semantic-kernel/blob/main/dotnet/notebooks/00-getting-started.ipynb\"\n", + "] = \"Jupyter notebook describing how to get started with the Semantic Kernel\"\n", + "github_files[\n", + " \"https://github.com/microsoft/semantic-kernel/tree/main/samples/skills/ChatSkill/ChatGPT\"\n", + "] = \"Sample demonstrating how to create a chat skill interfacing with ChatGPT\"\n", + "github_files[\n", + " \"https://github.com/microsoft/semantic-kernel/blob/main/dotnet/src/SemanticKernel/Memory/Volatile/VolatileMemoryStore.cs\"\n", + "] = \"C# class that defines a volatile embedding store\"" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Use `save_reference_async` to save the file:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "COLLECTION = \"SKGitHub\"\n", + "\n", + "print(\"Adding some GitHub file URLs and their descriptions to a volatile Semantic Memory.\")\n", + "i = 0\n", + "for entry, value in github_files.items():\n", + " await kernel.memory.save_reference_async(\n", + " collection=COLLECTION,\n", + " description=value,\n", + " text=value,\n", + " external_id=entry,\n", + " external_source_name=\"GitHub\",\n", + " )\n", + " i += 1\n", + " print(\" URL {} saved\".format(i))" + ] + }, + { + "cell_type": 
"markdown", + "metadata": {}, + "source": [ + "Use `search_async` to ask a question:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "ask = \"I love Jupyter notebooks, how should I get started?\"\n", + "print(\"===========================\\n\" + \"Query: \" + ask + \"\\n\")\n", + "\n", + "memories = await kernel.memory.search_async(COLLECTION, ask, limit=5, min_relevance_score=0.77)\n", + "\n", + "i = 0\n", + "for memory in memories:\n", + " i += 1\n", + " print(f\"Result {i}:\")\n", + " print(\" URL: : \" + memory.id)\n", + " print(\" Title : \" + memory.description)\n", + " print(\" Relevance: \" + str(memory.relevance))\n", + " print()" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.13" + } + }, + "nbformat": 4, + "nbformat_minor": 2 } diff --git a/python/pyproject.toml b/python/pyproject.toml index efcdda603260..cc420dd549e7 100644 --- a/python/pyproject.toml +++ b/python/pyproject.toml @@ -1,6 +1,6 @@ [tool.poetry] name = "semantic-kernel" -version = "0.4.3.dev" +version = "0.4.4.dev" description = "Semantic Kernel Python SDK" authors = ["Microsoft "] readme = "pip/README.md" diff --git a/python/samples/kernel-syntax-examples/openai_logit_bias.py b/python/samples/kernel-syntax-examples/openai_logit_bias.py index ea736bdcc653..d049debabb6a 100644 --- a/python/samples/kernel-syntax-examples/openai_logit_bias.py +++ b/python/samples/kernel-syntax-examples/openai_logit_bias.py @@ -1,9 +1,17 @@ # Copyright (c) Microsoft. All rights reserved. 
import asyncio +from typing import Any, Dict import semantic_kernel as sk import semantic_kernel.connectors.ai.open_ai as sk_oai +from semantic_kernel.connectors.ai.ai_request_settings import AIRequestSettings +from semantic_kernel.connectors.ai.chat_completion_client_base import ( + ChatCompletionClientBase, +) +from semantic_kernel.connectors.ai.text_completion_client_base import ( + TextCompletionClientBase, +) """ Logit bias enables prioritizing certain tokens within a given output. @@ -13,13 +21,11 @@ """ -def _config_ban_tokens(settings_type, keys): - settings = sk_oai.OpenAIRequestSettings() - +def _config_ban_tokens(settings: AIRequestSettings, keys: Dict[Any, Any]): # Map each token in the keys list to a bias value from -100 (a potential ban) to 100 (exclusive selection) for k in keys: # -100 to potentially ban all tokens in the list - settings.token_selection_biases[k] = -100 + settings.logit_bias[k] = -100 return settings @@ -59,7 +65,8 @@ async def chat_request_example(kernel, api_key, org_id): ] # Model will try its best to avoid using any of the above words - settings = _config_ban_tokens("chat", keys) + settings = kernel.get_request_settings_from_service(ChatCompletionClientBase, "chat_service") + settings = _config_ban_tokens(settings, keys) prompt_config = sk.PromptTemplateConfig.from_completion_parameters(max_tokens=2000, temperature=0.7, top_p=0.8) prompt_template = sk.ChatPromptTemplate("{{$user_input}}", kernel.prompt_template_engine, prompt_config) @@ -71,15 +78,18 @@ async def chat_request_example(kernel, api_key, org_id): function_config = sk.SemanticFunctionConfig(prompt_config, prompt_template) kernel.register_semantic_function("ChatBot", "Chat", function_config) - chat_messages = list() + chat_messages = [] + messages = [{"role": "user", "content": user_mssg}] + chat_messages.append(("user", user_mssg)) - answer = await openai_chat_completion.complete_chat_async(chat_messages, settings) - chat_messages.append(("assistant", str(answer))) + 
answer = await openai_chat_completion.complete_chat_async(messages=messages, settings=settings) + chat_messages.append(("assistant", str(answer[0]))) user_mssg = "What are his best all-time stats?" + messages = [{"role": "user", "content": user_mssg}] chat_messages.append(("user", user_mssg)) - answer = await openai_chat_completion.complete_chat_async(chat_messages, settings) - chat_messages.append(("assistant", str(answer))) + answer = await openai_chat_completion.complete_chat_async(messages=messages, settings=settings) + chat_messages.append(("assistant", str(answer[0]))) context_vars = sk.ContextVariables() context_vars["chat_history"] = "" @@ -140,7 +150,8 @@ async def text_complete_request_example(kernel, api_key, org_id): ] # Model will try its best to avoid using any of the above words - settings = _config_ban_tokens("complete", keys) + settings = kernel.get_request_settings_from_service(TextCompletionClientBase, "text_service") + settings = _config_ban_tokens(settings, keys) user_mssg = "The best pie flavor to have in autumn is" answer = await openai_text_completion.complete_async(user_mssg, settings) diff --git a/python/semantic_kernel/connectors/ai/hugging_face/hf_request_settings.py b/python/semantic_kernel/connectors/ai/hugging_face/hf_request_settings.py index b20948014d41..3928649af400 100644 --- a/python/semantic_kernel/connectors/ai/hugging_face/hf_request_settings.py +++ b/python/semantic_kernel/connectors/ai/hugging_face/hf_request_settings.py @@ -28,7 +28,7 @@ def prepare_settings_dict(self, **kwargs) -> Dict[str, Any]: gen_config = self.get_generation_config() if "prompt" in kwargs and kwargs["prompt"] is not None: return { - "prompt": kwargs["prompt"], + "text_inputs": kwargs["prompt"], "generation_config": gen_config, "num_return_sequences": self.num_return_sequences, "do_sample": self.do_sample, diff --git a/python/semantic_kernel/connectors/ai/hugging_face/services/hf_text_completion.py 
b/python/semantic_kernel/connectors/ai/hugging_face/services/hf_text_completion.py index 5502ed6f1053..6ccbd7566e15 100644 --- a/python/semantic_kernel/connectors/ai/hugging_face/services/hf_text_completion.py +++ b/python/semantic_kernel/connectors/ai/hugging_face/services/hf_text_completion.py @@ -81,7 +81,7 @@ async def complete_async( if kwargs.get("logger"): logger.warning("The `logger` parameter is deprecated. Please use the `logging` module instead.") try: - results = self.generator(**request_settings.prepare_settings_dict(prompt)) + results = self.generator(**request_settings.prepare_settings_dict(prompt=prompt)) result_field_name = "summary_text" if self.task == "summarization" else "generated_text" if len(results) == 1: return results[0][result_field_name] diff --git a/python/semantic_kernel/connectors/ai/open_ai/request_settings/open_ai_request_settings.py b/python/semantic_kernel/connectors/ai/open_ai/request_settings/open_ai_request_settings.py index e48ead848046..3e5eca639dc5 100644 --- a/python/semantic_kernel/connectors/ai/open_ai/request_settings/open_ai_request_settings.py +++ b/python/semantic_kernel/connectors/ai/open_ai/request_settings/open_ai_request_settings.py @@ -14,7 +14,7 @@ class OpenAIRequestSettings(AIRequestSettings): ai_model_id: Optional[str] = Field(None, serialization_alias="model") frequency_penalty: float = Field(0.0, ge=-2.0, le=2.0) - logit_bias: Dict[str, float] = Field(default_factory=dict) + logit_bias: Dict[Union[str, int], float] = Field(default_factory=dict) max_tokens: int = Field(256, gt=0) number_of_responses: int = Field(1, ge=1, le=128, serialization_alias="n") presence_penalty: float = Field(0.0, ge=-2.0, le=2.0) From 1c2d0fe4b3350224184230608f6b5bef025ed3fc Mon Sep 17 00:00:00 2001 From: Gil LaHaye Date: Fri, 5 Jan 2024 09:51:56 -0800 Subject: [PATCH 3/5] .Net: Avoid causing first-chance exceptions in CodeTokenizer (#4471) ### Motivation and Context The CodeTokenizer routinely causes first-chance (caught) 
exceptions to determine whether tokens belong to function names of named argument blocks. This is inefficient but also can be startling depending on how one has set one's configuration for breaking on exceptions. See #4418 ### Description CodeTokenizer now uses a new method from NamedArgBlock to determine whether a string could result in a NamedArgBlock instead of resorting to causing exceptions to gather the same information. ### Contribution Checklist - [ ] The code builds clean without any errors or warnings - [ ] The PR follows the [SK Contribution Guidelines](https://github.com/microsoft/semantic-kernel/blob/main/CONTRIBUTING.md) and the [pre-submission formatting script](https://github.com/microsoft/semantic-kernel/blob/main/CONTRIBUTING.md#development-scripts) raises no violations - [ ] All unit tests pass, and I have added new tests where possible - [ ] I didn't break anyone :smile: --- .../TemplateEngine/Blocks/NamedArgBlock.cs | 42 ++++++++++++++----- .../TemplateEngine/CodeTokenizer.cs | 11 +++-- .../Blocks/NamedArgBlockTests.cs | 6 +-- .../TemplateEngine/CodeTokenizerTests.cs | 8 ++-- 4 files changed, 44 insertions(+), 23 deletions(-) diff --git a/dotnet/src/SemanticKernel.Core/TemplateEngine/Blocks/NamedArgBlock.cs b/dotnet/src/SemanticKernel.Core/TemplateEngine/Blocks/NamedArgBlock.cs index 2ab6b23b4a99..2da0df2dd1b2 100644 --- a/dotnet/src/SemanticKernel.Core/TemplateEngine/Blocks/NamedArgBlock.cs +++ b/dotnet/src/SemanticKernel.Core/TemplateEngine/Blocks/NamedArgBlock.cs @@ -1,5 +1,6 @@ // Copyright (c) Microsoft. All rights reserved. +using System; using System.Text.RegularExpressions; using Microsoft.Extensions.Logging; @@ -35,21 +36,14 @@ internal sealed class NamedArgBlock : Block, ITextRendering public NamedArgBlock(string? text, ILoggerFactory? 
logger = null) : base(NamedArgBlock.TrimWhitespace(text), logger) { - var argParts = this.Content.Split(Symbols.NamedArgBlockSeparator); - if (argParts.Length != 2) + if (!TryGetNameAndValue(this.Content, out string argName, out string argValue)) { this.Logger.LogError("Invalid named argument `{Text}`", text); throw new KernelException($"A function named argument must contain a name and value separated by a '{Symbols.NamedArgBlockSeparator}' character."); } - this.Name = argParts[0]; - this._argNameAsVarBlock = new VarBlock($"{Symbols.VarPrefix}{argParts[0]}"); - var argValue = argParts[1]; - if (argValue.Length == 0) - { - this.Logger.LogError("Invalid named argument `{Text}`", text); - throw new KernelException($"A function named argument must contain a quoted value or variable after the '{Symbols.NamedArgBlockSeparator}' character."); - } + this.Name = argName; + this._argNameAsVarBlock = new VarBlock($"{Symbols.VarPrefix}{argName}"); if (argValue[0] == Symbols.VarPrefix) { @@ -61,6 +55,34 @@ public NamedArgBlock(string? text, ILoggerFactory? logger = null) } } + /// + /// Attempts to extract the name and value of a named argument block from a string + /// + /// String from which to extract a name and value + /// Name extracted from argument block, when successful. Empty string otherwise. + /// Value extracted from argument block, when successful. Empty string otherwise. + /// true when a name and value are successfully extracted from the given text, false otherwise + internal static bool TryGetNameAndValue(string? 
text, out string name, out string value) + { + name = string.Empty; + value = string.Empty; + + if (!string.IsNullOrEmpty(text)) + { + string[] argBlockParts = text!.Split(new char[] { Symbols.NamedArgBlockSeparator }, StringSplitOptions.RemoveEmptyEntries); + + if (argBlockParts.Length == 2) + { + name = argBlockParts[0]; + value = argBlockParts[1]; + + return true; + } + } + + return false; + } + /// /// Gets the rendered value of the function argument. If the value is a , the value stays the same. /// If the value is a , the value of the variable is determined by the arguments passed in. diff --git a/dotnet/src/SemanticKernel.Core/TemplateEngine/CodeTokenizer.cs b/dotnet/src/SemanticKernel.Core/TemplateEngine/CodeTokenizer.cs index ed11e57b59f9..44206060aaf0 100644 --- a/dotnet/src/SemanticKernel.Core/TemplateEngine/CodeTokenizer.cs +++ b/dotnet/src/SemanticKernel.Core/TemplateEngine/CodeTokenizer.cs @@ -322,14 +322,13 @@ private static bool CanBeEscaped(char c) Justification = "Does not throw an exception by design.")] private static bool IsValidNamedArg(string tokenContent) { - try + if (NamedArgBlock.TryGetNameAndValue(tokenContent, out string _, out string _)) { var tokenContentAsNamedArg = new NamedArgBlock(tokenContent); - return tokenContentAsNamedArg.IsValid(out var error); - } - catch - { - return false; + + return tokenContentAsNamedArg.IsValid(out string _); } + + return false; } } diff --git a/dotnet/src/SemanticKernel.UnitTests/TemplateEngine/Blocks/NamedArgBlockTests.cs b/dotnet/src/SemanticKernel.UnitTests/TemplateEngine/Blocks/NamedArgBlockTests.cs index 9353b87e8fcd..2e6fb7052ecf 100644 --- a/dotnet/src/SemanticKernel.UnitTests/TemplateEngine/Blocks/NamedArgBlockTests.cs +++ b/dotnet/src/SemanticKernel.UnitTests/TemplateEngine/Blocks/NamedArgBlockTests.cs @@ -115,11 +115,11 @@ public void ArgValueNeedsQuoteOrDollarSignPrefix() public void ArgNameShouldBeNonEmpty() { // Arrange - var target = new NamedArgBlock("='b'"); + static NamedArgBlock 
funcToTest() => new("='b'"); // Act + Assert - Assert.False(target.IsValid(out var error)); - Assert.Equal("A named argument must have a name", error); + KernelException exception = Assert.Throws(funcToTest); + Assert.Equal("A function named argument must contain a name and value separated by a '=' character.", exception.Message); } [Fact] diff --git a/dotnet/src/SemanticKernel.UnitTests/TemplateEngine/CodeTokenizerTests.cs b/dotnet/src/SemanticKernel.UnitTests/TemplateEngine/CodeTokenizerTests.cs index 62d90dbfe5b2..d6c185386547 100644 --- a/dotnet/src/SemanticKernel.UnitTests/TemplateEngine/CodeTokenizerTests.cs +++ b/dotnet/src/SemanticKernel.UnitTests/TemplateEngine/CodeTokenizerTests.cs @@ -209,12 +209,12 @@ public void ItThrowsWhenSeparatorsAreMissing(string template) } [Theory] - [InlineData("f a =", "A function named argument must contain a quoted value or variable after the '=' character.")] - [InlineData("f a='b' arg2", "A function named argument must contain a name and value separated by a '=' character.")] - public void ItThrowsWhenArgValueIsMissing(string template, string expectedErrorMessage) + [InlineData("f a =")] + [InlineData("f a='b' arg2")] + public void ItThrowsWhenArgValueIsMissing(string template) { // Act & Assert var exception = Assert.Throws(() => this._target.Tokenize(template)); - Assert.Equal(expectedErrorMessage, exception.Message); + Assert.Equal("A function named argument must contain a name and value separated by a '=' character.", exception.Message); } } From 86cb05fde595d49503fad45fd7f525f7d68e3213 Mon Sep 17 00:00:00 2001 From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com> Date: Mon, 8 Jan 2024 07:53:45 +0000 Subject: [PATCH 4/5] .Net: Bump xunit.analyzers from 1.7.0 to 1.8.0 in /dotnet (#4426) Bumps [xunit.analyzers](https://github.com/xunit/xunit.analyzers) from 1.7.0 to 1.8.0.
Commits
  • 559d488 v1.8.0
  • 7b8a772 Support Roslyn 3.11, 4.2, 4.4, 4.6, and 4.8
  • 8edaa4a Update build scripts for the new .NET SDK 8 requirement
  • 8aa39e4 xunit/xunit#2849: Update xUnit1030 to handle ConfigureAwaitOptions
  • 49afdc9 Restructure DoNotUseConfigureAwaitFixerTests
  • a041234 Restructure DoNotUseConfigureAwaitTests
  • a34764a Update dependencies, and upgrade builder/test projects to .NET 8
  • bc3fd98 Shift xUnit1041 to be a Warning instead of an Error
  • 4db8815 xunit/xunit#2846: Optional parameters should not trigger xUnit1041
  • 9ca8812 Turn off CA1014
  • Additional commits viewable in compare view

[![Dependabot compatibility score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=xunit.analyzers&package-manager=nuget&previous-version=1.7.0&new-version=1.8.0)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores) Dependabot will resolve any conflicts with this PR as long as you don't alter it yourself. You can also trigger a rebase manually by commenting `@dependabot rebase`. [//]: # (dependabot-automerge-start) [//]: # (dependabot-automerge-end) ---
Dependabot commands and options
You can trigger Dependabot actions by commenting on this PR: - `@dependabot rebase` will rebase this PR - `@dependabot recreate` will recreate this PR, overwriting any edits that have been made to it - `@dependabot merge` will merge this PR after your CI passes on it - `@dependabot squash and merge` will squash and merge this PR after your CI passes on it - `@dependabot cancel merge` will cancel a previously requested merge and block automerging - `@dependabot reopen` will reopen this PR if it is closed - `@dependabot close` will close this PR and stop Dependabot recreating it. You can achieve the same result by closing it manually - `@dependabot show ignore conditions` will show all of the ignore conditions of the specified dependency - `@dependabot ignore this major version` will close this PR and stop Dependabot creating any more for this major version (unless you reopen the PR or upgrade to it yourself) - `@dependabot ignore this minor version` will close this PR and stop Dependabot creating any more for this minor version (unless you reopen the PR or upgrade to it yourself) - `@dependabot ignore this dependency` will close this PR and stop Dependabot creating any more for this dependency (unless you reopen the PR or upgrade to it yourself)
Signed-off-by: dependabot[bot] Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com> --- dotnet/Directory.Packages.props | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/dotnet/Directory.Packages.props b/dotnet/Directory.Packages.props index f512f324f306..657e599a5382 100644 --- a/dotnet/Directory.Packages.props +++ b/dotnet/Directory.Packages.props @@ -91,7 +91,7 @@ all runtime; build; native; contentfiles; analyzers; buildtransitive - + all runtime; build; native; contentfiles; analyzers; buildtransitive From 9db47e56155cf8cf4da3d4d1b95bde4833d80108 Mon Sep 17 00:00:00 2001 From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com> Date: Mon, 8 Jan 2024 07:54:30 +0000 Subject: [PATCH 5/5] .Net: Bump xunit from 2.6.3 to 2.6.4 in /dotnet (#4425) Bumps [xunit](https://github.com/xunit/xunit) from 2.6.3 to 2.6.4.
Commits

[![Dependabot compatibility score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=xunit&package-manager=nuget&previous-version=2.6.3&new-version=2.6.4)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores) Dependabot will resolve any conflicts with this PR as long as you don't alter it yourself. You can also trigger a rebase manually by commenting `@dependabot rebase`. [//]: # (dependabot-automerge-start) [//]: # (dependabot-automerge-end) ---
Dependabot commands and options
You can trigger Dependabot actions by commenting on this PR: - `@dependabot rebase` will rebase this PR - `@dependabot recreate` will recreate this PR, overwriting any edits that have been made to it - `@dependabot merge` will merge this PR after your CI passes on it - `@dependabot squash and merge` will squash and merge this PR after your CI passes on it - `@dependabot cancel merge` will cancel a previously requested merge and block automerging - `@dependabot reopen` will reopen this PR if it is closed - `@dependabot close` will close this PR and stop Dependabot recreating it. You can achieve the same result by closing it manually - `@dependabot show ignore conditions` will show all of the ignore conditions of the specified dependency - `@dependabot ignore this major version` will close this PR and stop Dependabot creating any more for this major version (unless you reopen the PR or upgrade to it yourself) - `@dependabot ignore this minor version` will close this PR and stop Dependabot creating any more for this minor version (unless you reopen the PR or upgrade to it yourself) - `@dependabot ignore this dependency` will close this PR and stop Dependabot creating any more for this dependency (unless you reopen the PR or upgrade to it yourself)
Signed-off-by: dependabot[bot] Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com> --- dotnet/Directory.Packages.props | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/dotnet/Directory.Packages.props b/dotnet/Directory.Packages.props index 657e599a5382..dde6071102d7 100644 --- a/dotnet/Directory.Packages.props +++ b/dotnet/Directory.Packages.props @@ -46,7 +46,7 @@ - +