feat: manually mirror opencoze's code from bytedance
Change-Id: I09a73aadda978ad9511264a756b2ce51f5761adf
This commit is contained in:
@@ -0,0 +1,212 @@
|
||||
/*
|
||||
* Copyright 2025 coze-dev Authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
package intentdetector
|
||||
|
||||
import (
|
||||
"context"
|
||||
"encoding/json"
|
||||
"errors"
|
||||
"strconv"
|
||||
"strings"
|
||||
|
||||
"github.com/cloudwego/eino/components/model"
|
||||
"github.com/cloudwego/eino/components/prompt"
|
||||
"github.com/cloudwego/eino/compose"
|
||||
"github.com/cloudwego/eino/schema"
|
||||
"github.com/spf13/cast"
|
||||
|
||||
"github.com/coze-dev/coze-studio/backend/domain/workflow/internal/nodes"
|
||||
"github.com/coze-dev/coze-studio/backend/pkg/lang/ternary"
|
||||
)
|
||||
|
||||
type Config struct {
|
||||
Intents []string
|
||||
SystemPrompt string
|
||||
IsFastMode bool
|
||||
ChatModel model.BaseChatModel
|
||||
}
|
||||
|
||||
const SystemIntentPrompt = `
|
||||
# Role
|
||||
You are an intention classification expert, good at being able to judge which classification the user's input belongs to.
|
||||
|
||||
## Skills
|
||||
Skill 1: Clearly determine which of the following intention classifications the user's input belongs to.
|
||||
Intention classification list:
|
||||
[
|
||||
{"classificationId": 0, "content": "Other intentions"},
|
||||
{{intents}}
|
||||
]
|
||||
|
||||
Note:
|
||||
- Please determine the match only between the user's input content and the Intention classification list content, without judging or categorizing the match with the classification ID.
|
||||
|
||||
{{advance}}
|
||||
|
||||
## Reply requirements
|
||||
- The answer must be returned in JSON format.
|
||||
- Strictly ensure that the output is in a valid JSON format.
|
||||
- Do not add prefix "json or suffix""
|
||||
- The answer needs to include the following fields such as:
|
||||
{
|
||||
"classificationId": 0,
|
||||
"reason": "Unclear intentions"
|
||||
}
|
||||
|
||||
##Limit
|
||||
- Please do not reply in text.
|
||||
`
|
||||
|
||||
const FastModeSystemIntentPrompt = `
|
||||
# Role
|
||||
You are an intention classification expert, good at being able to judge which classification the user's input belongs to.
|
||||
|
||||
## Skills
|
||||
Skill 1: Clearly determine which of the following intention classifications the user's input belongs to.
|
||||
Intention classification list:
|
||||
[
|
||||
{"classificationId": 0, "content": "Other intentions"},
|
||||
{{intents}}
|
||||
]
|
||||
|
||||
Note:
|
||||
- Please determine the match only between the user's input content and the Intention classification list content, without judging or categorizing the match with the classification ID.
|
||||
|
||||
|
||||
## Reply requirements
|
||||
- The answer must be a number indicated classificationId.
|
||||
- if not match, please just output an number 0.
|
||||
- do not output json format data, just output an number.
|
||||
|
||||
##Limit
|
||||
- Please do not reply in text.`
|
||||
|
||||
type IntentDetector struct {
|
||||
config *Config
|
||||
runner compose.Runnable[map[string]any, *schema.Message]
|
||||
}
|
||||
|
||||
func NewIntentDetector(ctx context.Context, cfg *Config) (*IntentDetector, error) {
|
||||
if cfg == nil {
|
||||
return nil, errors.New("cfg is required")
|
||||
}
|
||||
if !cfg.IsFastMode && cfg.ChatModel == nil {
|
||||
return nil, errors.New("config chat model is required")
|
||||
}
|
||||
|
||||
if len(cfg.Intents) == 0 {
|
||||
return nil, errors.New("config intents is required")
|
||||
}
|
||||
chain := compose.NewChain[map[string]any, *schema.Message]()
|
||||
|
||||
spt := ternary.IFElse[string](cfg.IsFastMode, FastModeSystemIntentPrompt, SystemIntentPrompt)
|
||||
|
||||
sptTemplate, err := nodes.TemplateRender(spt, map[string]interface{}{
|
||||
"intents": toIntentString(cfg.Intents),
|
||||
})
|
||||
if err != nil {
|
||||
return nil, err
|
||||
}
|
||||
prompts := prompt.FromMessages(schema.Jinja2,
|
||||
&schema.Message{Content: sptTemplate, Role: schema.System},
|
||||
&schema.Message{Content: "{{query}}", Role: schema.User})
|
||||
|
||||
r, err := chain.AppendChatTemplate(prompts).AppendChatModel(cfg.ChatModel).Compile(ctx)
|
||||
if err != nil {
|
||||
return nil, err
|
||||
}
|
||||
return &IntentDetector{
|
||||
config: cfg,
|
||||
runner: r,
|
||||
}, nil
|
||||
}
|
||||
|
||||
func (id *IntentDetector) parseToNodeOut(content string) (map[string]any, error) {
|
||||
nodeOutput := make(map[string]any)
|
||||
nodeOutput["classificationId"] = 0
|
||||
if content == "" {
|
||||
return nodeOutput, errors.New("content is empty")
|
||||
}
|
||||
|
||||
if id.config.IsFastMode {
|
||||
cid, err := strconv.ParseInt(content, 10, 64)
|
||||
if err != nil {
|
||||
return nodeOutput, err
|
||||
}
|
||||
nodeOutput["classificationId"] = cid
|
||||
return nodeOutput, nil
|
||||
}
|
||||
|
||||
leftIndex := strings.Index(content, "{")
|
||||
rightIndex := strings.Index(content, "}")
|
||||
if leftIndex == -1 || rightIndex == -1 {
|
||||
return nodeOutput, errors.New("content is invalid")
|
||||
}
|
||||
|
||||
err := json.Unmarshal([]byte(content[leftIndex:rightIndex+1]), &nodeOutput)
|
||||
if err != nil {
|
||||
return nodeOutput, err
|
||||
}
|
||||
|
||||
return nodeOutput, nil
|
||||
}
|
||||
|
||||
func (id *IntentDetector) Invoke(ctx context.Context, input map[string]any) (map[string]any, error) {
|
||||
query, ok := input["query"]
|
||||
if !ok {
|
||||
return nil, errors.New("input query field required")
|
||||
}
|
||||
|
||||
queryStr, ok := query.(string)
|
||||
if !ok {
|
||||
queryStr = cast.ToString(query)
|
||||
}
|
||||
|
||||
vars := make(map[string]any)
|
||||
vars["query"] = queryStr
|
||||
if !id.config.IsFastMode {
|
||||
ad, err := nodes.TemplateRender(id.config.SystemPrompt, map[string]any{"query": query})
|
||||
if err != nil {
|
||||
return nil, err
|
||||
}
|
||||
vars["advance"] = ad
|
||||
}
|
||||
o, err := id.runner.Invoke(ctx, vars)
|
||||
if err != nil {
|
||||
return nil, err
|
||||
}
|
||||
|
||||
return id.parseToNodeOut(o.Content)
|
||||
}
|
||||
|
||||
func toIntentString(its []string) string {
|
||||
type IntentVariableItem struct {
|
||||
ClassificationID int64 `json:"classificationId"`
|
||||
Content string `json:"content"`
|
||||
}
|
||||
|
||||
vs := make([]*IntentVariableItem, 0, len(its))
|
||||
|
||||
for idx, it := range its {
|
||||
vs = append(vs, &IntentVariableItem{
|
||||
ClassificationID: int64(idx + 1),
|
||||
Content: it,
|
||||
})
|
||||
}
|
||||
itsBytes, _ := json.Marshal(vs)
|
||||
return string(itsBytes)
|
||||
}
|
||||
@@ -0,0 +1,88 @@
|
||||
/*
|
||||
* Copyright 2025 coze-dev Authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
package intentdetector
|
||||
|
||||
import (
|
||||
"context"
|
||||
"fmt"
|
||||
"testing"
|
||||
|
||||
"github.com/cloudwego/eino/components/model"
|
||||
"github.com/cloudwego/eino/schema"
|
||||
"github.com/stretchr/testify/assert"
|
||||
)
|
||||
|
||||
type mockChatModel struct {
|
||||
topSeed bool
|
||||
}
|
||||
|
||||
func (m mockChatModel) Generate(ctx context.Context, input []*schema.Message, opts ...model.Option) (*schema.Message, error) {
|
||||
if m.topSeed {
|
||||
return &schema.Message{
|
||||
Content: "1",
|
||||
}, nil
|
||||
}
|
||||
return &schema.Message{
|
||||
Content: `{"classificationId":1,"reason":"高兴"}`,
|
||||
}, nil
|
||||
}
|
||||
|
||||
func (m mockChatModel) Stream(ctx context.Context, input []*schema.Message, opts ...model.Option) (*schema.StreamReader[*schema.Message], error) {
|
||||
return nil, nil
|
||||
}
|
||||
|
||||
func (m mockChatModel) BindTools(tools []*schema.ToolInfo) error {
|
||||
return nil
|
||||
}
|
||||
|
||||
func TestNewIntentDetector(t *testing.T) {
|
||||
ctx := context.Background()
|
||||
t.Run("fast mode", func(t *testing.T) {
|
||||
dt, err := NewIntentDetector(ctx, &Config{
|
||||
Intents: []string{"高兴", "悲伤"},
|
||||
IsFastMode: true,
|
||||
ChatModel: &mockChatModel{topSeed: true},
|
||||
})
|
||||
assert.Nil(t, err)
|
||||
|
||||
ret, err := dt.Invoke(ctx, map[string]any{
|
||||
"query": "我考了100分",
|
||||
})
|
||||
assert.Nil(t, err)
|
||||
assert.Equal(t, ret["classificationId"], int64(1))
|
||||
})
|
||||
|
||||
t.Run("full mode", func(t *testing.T) {
|
||||
|
||||
dt, err := NewIntentDetector(ctx, &Config{
|
||||
Intents: []string{"高兴", "悲伤"},
|
||||
IsFastMode: false,
|
||||
ChatModel: &mockChatModel{},
|
||||
})
|
||||
assert.Nil(t, err)
|
||||
|
||||
ret, err := dt.Invoke(ctx, map[string]any{
|
||||
"query": "我考了100分",
|
||||
})
|
||||
fmt.Println(err)
|
||||
assert.Nil(t, err)
|
||||
fmt.Println(ret)
|
||||
assert.Equal(t, ret["classificationId"], float64(1))
|
||||
assert.Equal(t, ret["reason"], "高兴")
|
||||
})
|
||||
|
||||
}
|
||||
Reference in New Issue
Block a user