docs: multi-agent docs (#1200)

firebase · Nov 7, 2024 · fc58fad · fc58fad
1 parent c358582
commit fc58fad
Show file tree

Hide file tree

Showing 4 changed files with 190 additions and 0 deletions.
diff --git a/docs/_guides.yaml b/docs/_guides.yaml
@@ -37,6 +37,8 @@ toc:
     path: /docs/genkit/tool-calling
   - title: Retrieval-augmented generation (RAG)
     path: /docs/genkit/rag
+  - title: Multi-agent systems
+    path: /docs/genkit/multi-agent
   - title: Evaluation
     path: /docs/genkit/evaluation
   - title: Observability & monitoring

diff --git a/docs/multi-agent.md b/docs/multi-agent.md
@@ -0,0 +1,53 @@
+# Building multi-agent systems
+
+A powerful application of large language models is the LLM-powered agent. An
+agent is a system that can carry out complex tasks by planning how to break
+tasks into smaller ones, and (with the help of [tool calling](tool-calling))
+execute tasks that interact with external resources such as databases or even
+physical devices.
+
+Here are some excerpts from a very simple customer service agent built using a
+single prompt and several tools:
+
+```ts
+{% includecode github_path="firebase/genkit/js/doc-snippets/src/multi-agent/simple.ts" region_tag="tools" adjust_indentation="auto" %}
+```
+
+```ts
+{% includecode github_path="firebase/genkit/js/doc-snippets/src/multi-agent/simple.ts" region_tag="chat" adjust_indentation="auto" %}
+```
+
+A simple architecture like the one shown above can be sufficient when your agent
+only has a few capabilities. However, even in this limited example, you can see
+that it lacks some capabilities that customers would likely expect: for
+example, listing the customer's current reservations, canceling a reservation,
+and so on. As you build more and more tools to implement these additional
+capabilities, you start to run into some problems:
+
+*   The more tools you add, the more you stretch the model's ability to
+    consistently and correctly employ the right tool for the job.
+*   Some tasks might best be served through a more focused back and forth
+    between the user and the agent, rather than by a single tool call.
+*   Some tasks might benefit from a specialized prompt. For example, if your
+    agent is responding to an unhappy customer, you might want its tone to be
+    more business-like, whereas the agent that greets the customer initially can
+    have a more friendly and lighthearted tone.
+
+One approach you can use to deal with these issues that arise when building
+complex agents is to create many specialized agents and use a general-purpose
+agent to delegate tasks to them. Genkit supports this architecture by allowing
+you to specify prompts as tools. Each prompt represents a single specialized
+agent, with its own set of tools available to it, and those agents are in turn
+available as tools to your single orchestration agent, which is the primary
+interface with the user.
+
+Here's what an expanded version of the previous example might look like as a
+multi-agent system:
+
+```ts
+{% includecode github_path="firebase/genkit/js/doc-snippets/src/multi-agent/multi.ts" region_tag="agents" adjust_indentation="auto" %}
+```
+
+```ts
+{% includecode github_path="firebase/genkit/js/doc-snippets/src/multi-agent/multi.ts" region_tag="chat" adjust_indentation="auto" %}
+```
diff --git a/js/doc-snippets/src/multi-agent/multi.ts b/js/doc-snippets/src/multi-agent/multi.ts
@@ -0,0 +1,62 @@
+/**
+ * Copyright 2024 Google LLC
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import { genkit } from 'genkit';
+
+const ai = genkit({}); // Genkit instance created with an empty options object
+const reservationTool = ai.defineTool( // placeholder tool, declared before the [START agents] region
+  {
+    name: '', // left empty in this stub
+    description: '', // left empty in this stub
+  },
+  async () => {} // no-op handler: takes no arguments and resolves to undefined
+);
+const reservationCancelationTool = reservationTool; // alias of the same stub tool object
+const reservationListTool = reservationTool; // alias of the same stub tool object
+
+// [START agents]
+// Define a prompt that represents a specialist agent (here: reservations)
+const reservationAgent = ai.definePrompt(
+  {
+    name: 'reservationAgent',
+    description: 'Reservation Agent can help manage guest reservations',
+    tools: [reservationTool, reservationCancelationTool, reservationListTool], // tools available to this agent
+  },
+  '{{role "system"}} Help guests make and manage reservations' // prompt text, opening with a system-role marker
+);
+
+// Or load agents from .prompt files (the files themselves are not part of this snippet)
+const menuInfoAgent = ai.prompt('menuInfoAgent'); // looked up by the string 'menuInfoAgent'
+const complaintAgent = ai.prompt('complaintAgent'); // looked up by the string 'complaintAgent'
+
+// The triage agent is the agent that users interact with initially
+const triageAgent = ai.definePrompt(
+  {
+    name: 'triageAgent',
+    description: 'Triage Agent',
+    tools: [reservationAgent, menuInfoAgent, complaintAgent], // the specialist agents (prompts) are passed as tools
+  },
+  `{{role "system"}} You are an AI customer service agent for Pavel's Cafe.
+  Greet the user and ask them how you can help. If appropriate, transfer to an
+  agent that can better handle the request. If you cannot help the customer with
+  the available tools, politely explain so.`
+);
+// [END agents]
+
+// [START chat]
+// Start a chat session, initially with the triage agent
+const chat = ai.chat({ preamble: triageAgent }); // triageAgent is supplied through the `preamble` option
+// [END chat]
diff --git a/js/doc-snippets/src/multi-agent/simple.ts b/js/doc-snippets/src/multi-agent/simple.ts
@@ -0,0 +1,73 @@
+/**
+ * Copyright 2024 Google LLC
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import { gemini15Pro } from '@genkit-ai/googleai';
+import { genkit, z } from 'genkit';
+
+const ai = genkit({}); // Genkit instance created with an empty options object; used by the tools and chat below
+
+// [START tools]
+const menuLookupTool = ai.defineTool(
+  {
+    name: 'menuLookupTool',
+    description: 'use this tool to look up the menu for a given date',
+    inputSchema: z.object({ // input: an object with a single string field, `date`
+      date: z.string().describe('the date to look up the menu for'),
+    }),
+    outputSchema: z.string().describe('the menu for a given date'), // output: a string
+  },
+  async (input) => {
+    // Retrieve the menu from a database, website, etc.
+    // [START_EXCLUDE]
+    return ''; // stub value; sits between the EXCLUDE markers (presumably omitted from the rendered snippet)
+    // [END_EXCLUDE]
+  }
+);
+
+const reservationTool = ai.defineTool(
+  {
+    name: 'reservationTool',
+    description: 'use this tool to try to book a reservation',
+    inputSchema: z.object({
+      partySize: z.coerce.number().describe('the number of guests'), // coerced to a number by the schema
+      date: z.string().describe('the date to book for'),
+    }),
+    outputSchema: z // NOTE(review): schema is a string while the description speaks of true/false — confirm intent
+      .string()
+      .describe(
+        "true if the reservation was successfully booked and false if there's" +
+          ' no table available for the requested time'
+      ),
+  },
+  async (input) => {
+    // Access your database to try to make the reservation.
+    // [START_EXCLUDE]
+    return ''; // stub value; sits between the EXCLUDE markers (presumably omitted from the rendered snippet)
+    // [END_EXCLUDE]
+  }
+);
+// [END tools]
+
+// [START chat]
+const chat = ai.chat({
+  model: gemini15Pro, // model reference imported from '@genkit-ai/googleai'
+  system: // system prompt; the concatenation only wraps one string across lines
+    "You are an AI customer service agent for Pavel's Cafe. Use the tools " +
+    'available to you to help the customer. If you cannot help the ' +
+    'customer with the available tools, politely explain so.',
+  tools: [menuLookupTool, reservationTool], // the two tools defined above
+});
+// [END chat]