genkit-ai
diff --git a/‎.github/workflows/go.yml‎
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/go.yml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎go/README.md‎
Lines changed: 73 additions & 16 deletions b/‎go/README.md‎
Lines changed: 73 additions & 16 deletions
diff --git a/‎go/ai/document.go‎
Lines changed: 27 additions & 0 deletions b/‎go/ai/document.go‎
Lines changed: 27 additions & 0 deletions
diff --git a/‎go/ai/document_test.go‎
Lines changed: 106 additions & 0 deletions b/‎go/ai/document_test.go‎
Lines changed: 106 additions & 0 deletions
@@ -29,7 +29,7 @@ jobs:
     runs-on: ubuntu-latest
     strategy:
       matrix:
-        go-version: ['1.24.x']
+        go-version: ['1.25.x', '1.26.x']
     steps:
       - name: Checkout Repo
         uses: actions/checkout@main
 
@@ -53,7 +53,7 @@ func main() {
     g := genkit.Init(ctx, genkit.WithPlugins(&googlegenai.GoogleAI{}))
 
     answer, err := genkit.GenerateText(ctx, g,
-        ai.WithModelName("googleai/gemini-2.5-flash"),
+        ai.WithModelName("googleai/gemini-flash-latest"),
         ai.WithPrompt("Why is Go a great language for AI applications?"),
     )
     if err != nil {
@@ -80,7 +80,7 @@ Call any model with a simple, unified API:
 
 ```go
 text, _ := genkit.GenerateText(ctx, g,
-    ai.WithModelName("googleai/gemini-2.5-flash"),
+    ai.WithModelName("googleai/gemini-flash-latest"),
     ai.WithPrompt("Explain quantum computing in simple terms."),
 )
 fmt.Println(text)
@@ -98,7 +98,7 @@ type Recipe struct {
 }
 
 recipe, _ := genkit.GenerateData[Recipe](ctx, g,
-    ai.WithModelName("googleai/gemini-2.5-flash"),
+    ai.WithModelName("googleai/gemini-flash-latest"),
     ai.WithPrompt("Create a recipe for chocolate chip cookies."),
 )
 fmt.Printf("Recipe: %s\n", recipe.Title)
@@ -112,7 +112,7 @@ Stream text as it's generated for responsive user experiences:
 
 ```go
 stream := genkit.GenerateStream(ctx, g,
-    ai.WithModelName("googleai/gemini-2.5-flash"),
+    ai.WithModelName("googleai/gemini-flash-latest"),
     ai.WithPrompt("Write a short story about a robot learning to paint."),
 )
 
@@ -145,7 +145,7 @@ type Recipe struct {
 }
 
 stream := genkit.GenerateDataStream[*Recipe](ctx, g,
-    ai.WithModelName("googleai/gemini-2.5-flash"),
+    ai.WithModelName("googleai/gemini-flash-latest"),
     ai.WithPrompt("Create a recipe for spaghetti carbonara."),
 )
 
@@ -184,7 +184,7 @@ weatherTool := genkit.DefineTool(g, "getWeather",
 )
 
 response, _ := genkit.Generate(ctx, g,
-    ai.WithModelName("googleai/gemini-2.5-flash"),
+    ai.WithModelName("googleai/gemini-flash-latest"),
     ai.WithPrompt("What's the weather like in San Francisco?"),
     ai.WithTools(weatherTool),
 )
@@ -226,7 +226,7 @@ transferTool := genkit.DefineTool(g, "transfer",
 
 // Handle interrupts in your flow
 resp, _ := genkit.Generate(ctx, g,
-    ai.WithModelName("googleai/gemini-2.5-flash"),
+    ai.WithModelName("googleai/gemini-flash-latest"),
     ai.WithPrompt("Transfer $5000 to account ABC123"),
     ai.WithTools(transferTool),
 )
@@ -248,6 +248,60 @@ if resp.FinishReason == ai.FinishReasonInterrupted {
 
 [See full example](samples/intermediate-interrupts)
 
+### Middleware
+
+Middleware wraps generation, model calls, and tool execution to add cross-cutting behavior without touching your flows. Register the `middleware` plugin during `Init` to expose the built-ins in the Dev UI, then attach them per call with `ai.WithUse`:
+
+```go
+import "github.com/firebase/genkit/go/plugins/middleware"
+
+g := genkit.Init(ctx, genkit.WithPlugins(
+    &googlegenai.GoogleAI{},
+    &middleware.Middleware{},
+))
+
+// Retry transient failures, then fall back to a secondary model if the primary
+// stays down. Middleware composes outer-to-inner: Retry { Fallback { model } }.
+response, _ := genkit.Generate(ctx, g,
+    ai.WithModelName("googleai/gemini-flash-latest"),
+    ai.WithPrompt("Explain quantum computing."),
+    ai.WithUse(
+        &middleware.Retry{MaxRetries: 3},
+        &middleware.Fallback{Models: []ai.ModelRef{
+            googlegenai.ModelRef("googleai/gemini-3.1-flash", nil),
+        }},
+    ),
+)
+```
+
+The `middleware` plugin also ships with [`ToolApproval`](plugins/middleware/tool_approval.go) for human-in-the-loop gating, [`Filesystem`](samples/basic-middleware/filesystem) for sandboxed file access, and [`Skills`](samples/basic-middleware/skills) for loadable `SKILL.md` skills. [See the retry + fallback sample](samples/basic-middleware/retry-fallback) for the full composition.
+
+### Custom Middleware
+
+Implement the `ai.Middleware` interface to build your own. Embed `ai.BaseMiddleware` to inherit pass-through defaults for the hooks you don't need, then override `WrapGenerate`, `WrapModel`, or `WrapTool`:
+
+```go
+type Logger struct {
+    ai.BaseMiddleware
+    Prefix string `json:"prefix,omitempty"`
+}
+
+func (l *Logger) Name() string      { return "mine/logger" }
+func (l *Logger) New() ai.Middleware { return &Logger{Prefix: l.Prefix} }
+
+func (l *Logger) WrapModel(ctx context.Context, params *ai.ModelParams, next ai.ModelNext) (*ai.ModelResponse, error) {
+    start := time.Now()
+    resp, err := next(ctx, params)
+    log.Printf("%s model call took %s", l.Prefix, time.Since(start))
+    return resp, err
+}
+
+// Use it like any built-in middleware.
+ai.WithUse(&Logger{Prefix: "[trace]"})
+```
+
+`New()` is called once per `Generate` invocation, so middleware can hold per-call state without worrying about concurrent use across calls. `Name()` must be unique and stable since it's the key used to register and reference the middleware from the Dev UI and across runtimes.
+
 ### Define Flows
 
 Wrap your AI logic in flows for better observability, testing, and deployment:
@@ -256,7 +310,7 @@ Wrap your AI logic in flows for better observability, testing, and deployment:
 jokeFlow := genkit.DefineFlow(g, "tellJoke",
     func(ctx context.Context, topic string) (string, error) {
         return genkit.GenerateText(ctx, g,
-            ai.WithModelName("googleai/gemini-2.5-flash"),
+            ai.WithModelName("googleai/gemini-flash-latest"),
             ai.WithPrompt("Tell me a joke about %s", topic),
         )
     },
@@ -276,7 +330,7 @@ Stream data from your flows using Server-Sent Events (SSE):
 genkit.DefineStreamingFlow(g, "streamStory",
     func(ctx context.Context, topic string, send core.StreamCallback[string]) (string, error) {
         stream := genkit.GenerateStream(ctx, g,
-            ai.WithModelName("googleai/gemini-2.5-flash"),
+            ai.WithModelName("googleai/gemini-flash-latest"),
             ai.WithPrompt("Write a story about %s", topic),
         )
 
@@ -306,14 +360,14 @@ genkit.DefineFlow(g, "processDocument",
         // Each Run call creates a traced step visible in the Dev UI
         summary, _ := genkit.Run(ctx, "summarize", func() (string, error) {
             return genkit.GenerateText(ctx, g,
-                ai.WithModelName("googleai/gemini-2.5-flash"),
+                ai.WithModelName("googleai/gemini-flash-latest"),
                 ai.WithPrompt("Summarize: %s", doc),
             )
         })
 
         keywords, _ := genkit.Run(ctx, "extractKeywords", func() ([]string, error) {
             return genkit.GenerateData[[]string](ctx, g,
-                ai.WithModelName("googleai/gemini-2.5-flash"),
+                ai.WithModelName("googleai/gemini-flash-latest"),
                 ai.WithPrompt("Extract keywords from: %s", summary),
             )
         })
@@ -331,7 +385,7 @@ Create reusable prompts with Handlebars templating:
 
 ```go
 greetingPrompt := genkit.DefinePrompt(g, "greeting",
-    ai.WithModelName("googleai/gemini-2.5-flash"),
+    ai.WithModelName("googleai/gemini-flash-latest"),
     ai.WithPrompt("Write a {{style}} greeting for {{name}}."),
 )
 
@@ -359,7 +413,7 @@ type Joke struct {
 }
 
 jokePrompt := genkit.DefineDataPrompt[JokeRequest, *Joke](g, "joke",
-    ai.WithModelName("googleai/gemini-2.5-flash"),
+    ai.WithModelName("googleai/gemini-flash-latest"),
     ai.WithPrompt("Tell a joke about {{topic}}."),
 )
 
@@ -387,7 +441,7 @@ Keep prompts separate from code using `.prompt` files with YAML frontmatter:
 ```yaml
 # prompts/recipe.prompt
 ---
-model: googleai/gemini-2.5-flash
+model: googleai/gemini-flash-latest
 input:
   schema: RecipeRequest
 output:
@@ -553,13 +607,13 @@ import "google.golang.org/genai"
 
 // Simple: just the model name
 response, _ := genkit.Generate(ctx, g,
-    ai.WithModelName("googleai/gemini-2.5-flash"),
+    ai.WithModelName("googleai/gemini-flash-latest"),
     ai.WithPrompt("Hello!"),
 )
 
 // Advanced: model name + provider-specific configuration
 response, _ := genkit.Generate(ctx, g,
-    ai.WithModel(googlegenai.ModelRef("googleai/gemini-2.5-flash", &genai.GenerateContentConfig{
+    ai.WithModel(googlegenai.ModelRef("googleai/gemini-flash-latest", &genai.GenerateContentConfig{
         Temperature:     genai.Ptr(float32(0.7)),
         MaxOutputTokens: genai.Ptr(int32(1000)),
         TopP:            genai.Ptr(float32(0.9)),
@@ -657,6 +711,9 @@ Explore working examples to see Genkit in action:
 | [basic-structured](samples/basic-structured) | Typed JSON output with `GenerateData` and `GenerateDataStream` |
 | [basic-prompts](samples/basic-prompts) | Prompt templates with Handlebars and `.prompt` files |
 | [intermediate-interrupts](samples/intermediate-interrupts) | Human-in-the-loop with tool interrupts |
+| [basic-middleware/retry-fallback](samples/basic-middleware/retry-fallback) | Composing `Retry` and `Fallback` middleware |
+| [basic-middleware/filesystem](samples/basic-middleware/filesystem) | Scoped filesystem tools for the model |
+| [basic-middleware/skills](samples/basic-middleware/skills) | On-demand loadable `SKILL.md` personas |
 | [prompts-embed](samples/prompts-embed) | Embed prompts in your binary |
 | [durable-streaming](samples/durable-streaming) | Reconnectable streams with replay |
 | [session](samples/session) | Stateful flows with typed session data |
 
@@ -19,6 +19,8 @@ package ai
 import (
 	"encoding/json"
 	"fmt"
+	"maps"
+	"slices"
 	"strings"
 )
 
@@ -44,6 +46,31 @@ type Part struct {
 	Metadata     map[string]any `json:"metadata,omitempty"`     // valid for all kinds
 }
 
+// Clone returns a shallow copy of the Part with its own Metadata and Custom
+// maps. Callers can add or remove map keys without mutating the original.
+func (p *Part) Clone() *Part {
+	if p == nil {
+		return nil
+	}
+	cp := *p
+	cp.Custom = maps.Clone(p.Custom)
+	cp.Metadata = maps.Clone(p.Metadata)
+	return &cp
+}
+
+// Clone returns a shallow copy of the Message with its own Content slice
+// and Metadata map. Callers can replace parts or add metadata keys without
+// mutating the original.
+func (m *Message) Clone() *Message {
+	if m == nil {
+		return nil
+	}
+	cp := *m
+	cp.Content = slices.Clone(m.Content)
+	cp.Metadata = maps.Clone(m.Metadata)
+	return &cp
+}
+
 type PartKind int8
 
 const (
 
@@ -17,6 +17,7 @@
 package ai
 
 import (
+	"bytes"
 	"encoding/json"
 	"reflect"
 	"testing"
@@ -411,3 +412,108 @@ func TestNewResponseForToolRequest(t *testing.T) {
 		}
 	})
 }
+
+// TestPartClone verifies that Part.Clone produces an independent copy.
+// Every Part field is populated so that adding a new field without updating
+// this test (and Clone) causes a failure.
+func TestPartClone(t *testing.T) {
+	orig := &Part{
+		Kind:        PartToolRequest,
+		ContentType: "application/json",
+		Text:        "body",
+		ToolRequest: &ToolRequest{Name: "tool", Input: map[string]any{"a": 1}},
+		// Normally a Part wouldn't have both ToolRequest and ToolResponse,
+		// but we populate everything to catch missing fields.
+		ToolResponse: &ToolResponse{Name: "tool", Output: "ok"},
+		Resource:     &ResourcePart{Uri: "res://x"},
+		Custom:       map[string]any{"ck": "cv"},
+		Metadata:     map[string]any{"sig": []byte{1, 2, 3}, "key": "val"},
+	}
+
+	// Guard: every field in the fixture must be non-zero.
+	// If someone adds a new field to Part this will fail, forcing them to
+	// add it here and verify Clone handles it.
+	rv := reflect.ValueOf(orig).Elem()
+	for i := range rv.NumField() {
+		if rv.Field(i).IsZero() {
+			t.Fatalf("Part field %q is zero in test fixture — populate it and verify Clone handles it", rv.Type().Field(i).Name)
+		}
+	}
+
+	cp := orig.Clone()
+
+	// Values must match.
+	if !reflect.DeepEqual(orig, cp) {
+		t.Fatal("Clone() values differ from original")
+	}
+
+	// Mutating clone's maps must not affect the original.
+	cp.Metadata["extra"] = true
+	if _, ok := orig.Metadata["extra"]; ok {
+		t.Error("mutating clone Metadata affected original")
+	}
+
+	cp.Custom["extra"] = true
+	if _, ok := orig.Custom["extra"]; ok {
+		t.Error("mutating clone Custom affected original")
+	}
+
+	// Go types in metadata (e.g. []byte) must be preserved, not string-ified.
+	sig, ok := cp.Metadata["sig"].([]byte)
+	if !ok {
+		t.Fatalf("Metadata[sig] type = %T, want []byte", cp.Metadata["sig"])
+	}
+	if !bytes.Equal(sig, []byte{1, 2, 3}) {
+		t.Errorf("Metadata[sig] = %v, want [1 2 3]", sig)
+	}
+
+	// nil Part.Clone() should return nil.
+	var nilPart *Part
+	if nilPart.Clone() != nil {
+		t.Error("nil Part.Clone() should return nil")
+	}
+}
+
+// TestMessageClone verifies that Message.Clone produces an independent copy.
+// Every Message field is populated so that adding a new field without updating
+// this test (and Clone) causes a failure.
+func TestMessageClone(t *testing.T) {
+	orig := &Message{
+		Role:     RoleModel,
+		Content:  []*Part{NewTextPart("hello"), NewTextPart("world")},
+		Metadata: map[string]any{"k": "v"},
+	}
+
+	// Guard: every field must be non-zero.
+	rv := reflect.ValueOf(orig).Elem()
+	for i := range rv.NumField() {
+		if rv.Field(i).IsZero() {
+			t.Fatalf("Message field %q is zero in test fixture — populate it and verify Clone handles it", rv.Type().Field(i).Name)
+		}
+	}
+
+	cp := orig.Clone()
+
+	// Values must match.
+	if !reflect.DeepEqual(orig, cp) {
+		t.Fatal("Clone() values differ from original")
+	}
+
+	// Mutating clone's Content slice must not affect the original.
+	cp.Content[0] = NewTextPart("replaced")
+	if orig.Content[0].Text != "hello" {
+		t.Error("mutating clone Content affected original")
+	}
+
+	// Mutating clone's Metadata must not affect the original.
+	cp.Metadata["extra"] = true
+	if _, ok := orig.Metadata["extra"]; ok {
+		t.Error("mutating clone Metadata affected original")
+	}
+
+	// nil Message.Clone() should return nil.
+	var nilMsg *Message
+	if nilMsg.Clone() != nil {
+		t.Error("nil Message.Clone() should return nil")
+	}
+}