feat(tool): json fix tool middleware

Change-Id: I00d90a0d23b68faccad77337aa1b511e22862b28
drew/english
shentong.martin 5 months ago committed by shentongmartin
parent 589b192304
commit a18a2c0538

@ -0,0 +1,75 @@
/*
* Copyright 2025 CloudWeGo Authors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
// This example shows how to configure the jsonfix middleware on a ToolsNode
// to repair invalid JSON arguments before invoking a local tool.
// Run: go run ./components/tool/middlewares/jsonfix/example
package main
import (
"context"
"fmt"
"github.com/cloudwego/eino/components/tool"
"github.com/cloudwego/eino/components/tool/utils"
"github.com/cloudwego/eino/compose"
"github.com/cloudwego/eino/schema"
jsonfix "github.com/cloudwego/eino-examples/components/tool/middlewares/jsonfix"
)
type greetReq struct {
Name string `json:"name"`
}
type greetResp struct {
Greeting string `json:"greeting"`
}
func main() {
ctx := context.Background()
// Define a simple local tool with JSON input/output using InferTool.
greeter, _ := utils.InferTool("greeter", "greet by name", func(ctx context.Context, in *greetReq) (*greetResp, error) {
return &greetResp{Greeting: "Hello, " + in.Name}, nil
})
// Create ToolsNode and register the jsonfix middleware.
tn, _ := compose.NewToolNode(ctx, &compose.ToolsNodeConfig{
Tools: []tool.BaseTool{greeter},
ToolCallMiddlewares: []compose.ToolMiddleware{jsonfix.Middleware()},
})
// Craft an Assistant message with an invalid JSON argument to simulate LLM output.
msg := schema.AssistantMessage("", nil)
msg.ToolCalls = []schema.ToolCall{{
ID: "1",
Function: schema.FunctionCall{
Name: "greeter",
Arguments: "noise <|FunctionCallBegin|>{\"name\":\"Alice\"1\"\"}<|FunctionCallEnd|>",
},
}}
// ToolsNode invokes the tool. Middleware repairs the argument first.
outs, err := tn.Invoke(ctx, msg)
if err != nil {
fmt.Println("error:", err)
return
}
for _, o := range outs {
fmt.Println("tool:", o.ToolName, "id:", o.ToolCallID, "content:", o.Content)
}
}

@ -0,0 +1,113 @@
/*
* Copyright 2025 CloudWeGo Authors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
// Package jsonfix provides a ToolMiddleware for Eino's ToolsNode that
// repairs malformed JSON arguments produced by LLMs before tool execution.
//
// Usage:
//
// conf := &compose.ToolsNodeConfig{
// Tools: []tool.BaseTool{yourTool},
// ToolCallMiddlewares: []compose.ToolMiddleware{jsonfix.Middleware()},
// }
//
// Behavior:
// - Fast-path returns original arguments when already valid JSON.
// - Strips common LLM artifacts and isolates the first {...} region.
// - Applies robust fix using jsonrepair only when input is invalid.
// - Safe for both invokable and streamable tools.
package jsonfix
import (
"context"
"encoding/json"
"strings"
"github.com/cloudwego/eino/compose"
"github.com/kaptinlin/jsonrepair"
)
// FixJSON is a helper endpoint that returns repaired JSON for diagnostics
// or standalone use. ToolsNode should prefer Invokable/Streamable middleware.
func FixJSON(ctx context.Context, in *compose.ToolInput) (*compose.ToolOutput, error) {
fixed := repair(in.Arguments)
return &compose.ToolOutput{Result: fixed}, nil
}
// Invokable wraps a non-stream tool endpoint to sanitize JSON arguments.
// Register via ToolCallMiddlewares to apply automatically to invokable tools.
func Invokable(next compose.InvokableToolEndpoint) compose.InvokableToolEndpoint {
return func(ctx context.Context, in *compose.ToolInput) (*compose.ToolOutput, error) {
in.Arguments = repair(in.Arguments)
return next(ctx, in)
}
}
// Streamable wraps a stream tool endpoint to sanitize JSON arguments.
// Register via ToolCallMiddlewares to apply automatically to streamable tools.
func Streamable(next compose.StreamableToolEndpoint) compose.StreamableToolEndpoint {
return func(ctx context.Context, in *compose.ToolInput) (*compose.StreamToolOutput, error) {
in.Arguments = repair(in.Arguments)
return next(ctx, in)
}
}
// Middleware bundles both invokable and streamable wrappers for convenience.
func Middleware() compose.ToolMiddleware {
return compose.ToolMiddleware{Invokable: Invokable, Streamable: Streamable}
}
// repair attempts minimal work first (validity check, region isolation) and
// only uses jsonrepair when necessary. It trims common LLM artifacts.
func repair(input string) string {
s := strings.TrimSpace(input)
// Fast-path: valid JSON as-is
if strings.HasPrefix(s, "{") && strings.HasSuffix(s, "}") && json.Valid([]byte(s)) {
return s
}
// Isolate JSON object region if present; strip noise if object-only is valid
i := strings.IndexByte(s, '{')
j := strings.LastIndexByte(s, '}')
if i >= 0 && j >= i {
sub := s[i : j+1]
if json.Valid([]byte(sub)) {
return sub
}
s = sub
}
// Remove common LLM artifacts
s = strings.TrimPrefix(s, "<|FunctionCallBegin|>")
s = strings.TrimSuffix(s, "<|FunctionCallEnd|>")
s = strings.TrimPrefix(s, "<think>")
// Attempt robust repair only when invalid
if json.Valid([]byte(s)) {
return s
}
// Heuristic: add missing leading/trailing brace if one side exists
if !strings.HasPrefix(s, "{") && strings.HasSuffix(s, "}") {
s = "{" + s
} else if strings.HasPrefix(s, "{") && !strings.HasSuffix(s, "}") {
s = s + "}"
}
out, err := jsonrepair.JSONRepair(s)
if err != nil {
return s
}
return out
}

@ -0,0 +1,185 @@
/*
* Copyright 2025 CloudWeGo Authors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package jsonfix
import (
"context"
"encoding/json"
"testing"
"github.com/cloudwego/eino/components/tool"
"github.com/cloudwego/eino/compose"
"github.com/cloudwego/eino/schema"
)
func echoEndpoint(_ context.Context, in *compose.ToolInput) (*compose.ToolOutput, error) {
return &compose.ToolOutput{Result: in.Arguments}, nil
}
func TestInvokableMiddleware_RepairsJSON(t *testing.T) {
mw := Invokable
chained := mw(echoEndpoint)
input := &compose.ToolInput{
Name: "test_tool",
Arguments: "noise <|FunctionCallBegin|>{\"a\":1}<|FunctionCallEnd|> more",
CallID: "id1",
}
out, err := chained(context.Background(), input)
if err != nil {
t.Fatalf("err: %v", err)
}
var m map[string]int
if e := json.Unmarshal([]byte(out.Result), &m); e != nil || m["a"] != 1 {
t.Fatalf("repair failed: %v %v", out.Result, e)
}
}
func TestStreamableMiddleware_RepairsJSON(t *testing.T) {
mw := Streamable
var captured string
next := func(_ context.Context, in *compose.ToolInput) (*compose.StreamToolOutput, error) {
captured = in.Arguments
return &compose.StreamToolOutput{Result: schema.StreamReaderFromArray([]string{"ok"})}, nil
}
chained := mw(next)
_, err := chained(context.Background(), &compose.ToolInput{Name: "t", Arguments: "{\"text\": \"He said \"hello\" to me\"}"})
if err != nil {
t.Fatalf("err: %v", err)
}
var m map[string]string
if e := json.Unmarshal([]byte(captured), &m); e != nil || m["text"] != "He said \"hello\" to me" {
t.Fatalf("repair failed: %v %v", captured, e)
}
}
func TestInvokableMiddleware_NoChangeForValidJSON(t *testing.T) {
mw := Invokable
chained := mw(echoEndpoint)
original := "{\"a\":1}"
out, err := chained(context.Background(), &compose.ToolInput{Name: "t", Arguments: original})
if err != nil {
t.Fatalf("err: %v", err)
}
if out.Result != original {
t.Fatalf("should not change valid json: got %s", out.Result)
}
}
func TestInvokableMiddleware_MissingBracesAndUnicode(t *testing.T) {
mw := Invokable
chained := mw(echoEndpoint)
inputs := []string{
"{\"key\":\"value\"", // missing tail
"\"key\":\"value\"}", // missing head
"{\"emoji\": \"😀😎\"}",
"{\"text\": \"line1\nline2\tTabbed\"}",
}
for _, in := range inputs {
out, err := chained(context.Background(), &compose.ToolInput{Name: "t", Arguments: in})
if err != nil {
t.Fatalf("err: %v", err)
}
var any map[string]string
if e := json.Unmarshal([]byte(out.Result), &any); e != nil {
t.Fatalf("unmarshal failed: %v for %v", e, out.Result)
}
}
}
type spyInvokable struct{}
func (s *spyInvokable) Info(_ context.Context) (*schema.ToolInfo, error) {
return &schema.ToolInfo{Name: "spy", Desc: ""}, nil
}
func (s *spyInvokable) InvokableRun(_ context.Context, argumentsInJSON string, _ ...tool.Option) (string, error) {
return argumentsInJSON, nil
}
func TestToolsNodeMiddleware_RepairsInvokable(t *testing.T) {
tn, err := compose.NewToolNode(context.Background(), &compose.ToolsNodeConfig{
Tools: []tool.BaseTool{&spyInvokable{}},
ToolCallMiddlewares: []compose.ToolMiddleware{Middleware()},
})
if err != nil {
t.Fatalf("new tools node err: %v", err)
}
msg := schema.AssistantMessage("", nil)
msg.ToolCalls = []schema.ToolCall{{
ID: "1",
Function: schema.FunctionCall{Name: "spy", Arguments: "garbage {\"x\": \"a \"quote\" b\"} tail"},
}}
outs, err := tn.Invoke(context.Background(), msg)
if err != nil {
t.Fatalf("invoke err: %v", err)
}
if len(outs) != 1 {
t.Fatalf("unexpected outs: %d", len(outs))
}
var m map[string]string
if e := json.Unmarshal([]byte(outs[0].Content), &m); e != nil || m["x"] != "a \"quote\" b" {
t.Fatalf("repair failed: %v %v", outs[0].Content, e)
}
}
func TestInvokableMiddleware_UnescapedBackslashesAndSingleQuotesAndTrailingComma(t *testing.T) {
mw := Invokable
chained := mw(echoEndpoint)
cases := []string{
// unescaped backslashes in Windows path
"{\"path\": \"C:\\Users\\name\\file.txt\"}",
// single-quoted JSON
"{'a': 'b'}",
// trailing comma
"{\"a\": 1, \"b\": 2, }",
}
for _, in := range cases {
out, err := chained(context.Background(), &compose.ToolInput{Name: "t", Arguments: in})
if err != nil {
t.Fatalf("err: %v", err)
}
var any map[string]any
if e := json.Unmarshal([]byte(out.Result), &any); e != nil {
t.Fatalf("unmarshal failed: %v for %v", e, out.Result)
}
}
}
func TestInvokableMiddleware_RawQuotesInsideStringValue(t *testing.T) {
mw := Invokable
chained := mw(echoEndpoint)
// invalid JSON: raw quotes inside value
in := "{\"a\":\"b\"1\"\"}"
out, err := chained(context.Background(), &compose.ToolInput{Name: "t", Arguments: in})
if err != nil {
t.Fatalf("err: %v", err)
}
var m map[string]string
if e := json.Unmarshal([]byte(out.Result), &m); e != nil {
t.Fatalf("unmarshal failed: %v for %v", e, out.Result)
}
v := m["a"]
if v == "" || v[0] != 'b' {
t.Fatalf("unexpected repaired value: %q", v)
}
}
Loading…
Cancel
Save