88 lines
		
	
	
		
			2.7 KiB
		
	
	
	
		
			Go
		
	
	
	
			
		
		
	
	
			88 lines
		
	
	
		
			2.7 KiB
		
	
	
	
		
			Go
		
	
	
	
/*
 * Copyright 2025 coze-dev Authors
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 | 
						|
 | 
						|
package impl
 | 
						|
 | 
						|
import (
 | 
						|
	"context"
 | 
						|
 | 
						|
	"github.com/coze-dev/coze-studio/backend/api/model/crossdomain/knowledge"
 | 
						|
	"github.com/coze-dev/coze-studio/backend/domain/knowledge/entity"
 | 
						|
	"github.com/coze-dev/coze-studio/backend/domain/knowledge/processor"
 | 
						|
	"github.com/coze-dev/coze-studio/backend/domain/knowledge/repository"
 | 
						|
	"github.com/coze-dev/coze-studio/backend/infra/contract/document/parser"
 | 
						|
	"github.com/coze-dev/coze-studio/backend/infra/contract/eventbus"
 | 
						|
	"github.com/coze-dev/coze-studio/backend/infra/contract/idgen"
 | 
						|
	"github.com/coze-dev/coze-studio/backend/infra/contract/rdb"
 | 
						|
	"github.com/coze-dev/coze-studio/backend/infra/contract/storage"
 | 
						|
)
 | 
						|
 | 
						|
type DocProcessorConfig struct {
 | 
						|
	UserID         int64
 | 
						|
	SpaceID        int64
 | 
						|
	DocumentSource entity.DocumentSource
 | 
						|
	Documents      []*entity.Document
 | 
						|
 | 
						|
	KnowledgeRepo repository.KnowledgeRepo
 | 
						|
	DocumentRepo  repository.KnowledgeDocumentRepo
 | 
						|
	SliceRepo     repository.KnowledgeDocumentSliceRepo
 | 
						|
	Idgen         idgen.IDGenerator
 | 
						|
	Storage       storage.Storage
 | 
						|
	Rdb           rdb.RDB
 | 
						|
	Producer      eventbus.Producer
 | 
						|
	ParseManager  parser.Manager
 | 
						|
}
 | 
						|
 | 
						|
func NewDocProcessor(ctx context.Context, config *DocProcessorConfig) (p processor.DocProcessor) {
 | 
						|
	base := &baseDocProcessor{
 | 
						|
		ctx:            ctx,
 | 
						|
		UserID:         config.UserID,
 | 
						|
		SpaceID:        config.SpaceID,
 | 
						|
		Documents:      config.Documents,
 | 
						|
		documentSource: &config.DocumentSource,
 | 
						|
		knowledgeRepo:  config.KnowledgeRepo,
 | 
						|
		documentRepo:   config.DocumentRepo,
 | 
						|
		sliceRepo:      config.SliceRepo,
 | 
						|
		storage:        config.Storage,
 | 
						|
		idgen:          config.Idgen,
 | 
						|
		rdb:            config.Rdb,
 | 
						|
		producer:       config.Producer,
 | 
						|
		parseManager:   config.ParseManager,
 | 
						|
	}
 | 
						|
 | 
						|
	switch config.DocumentSource {
 | 
						|
	case entity.DocumentSourceCustom:
 | 
						|
		p = &customDocProcessor{
 | 
						|
			baseDocProcessor: *base,
 | 
						|
		}
 | 
						|
		if config.Documents[0].Type == knowledge.DocumentTypeTable {
 | 
						|
			p = &customTableProcessor{
 | 
						|
				baseDocProcessor: *base,
 | 
						|
			}
 | 
						|
		}
 | 
						|
		return p
 | 
						|
	case entity.DocumentSourceLocal:
 | 
						|
		if config.Documents[0].Type == knowledge.DocumentTypeTable {
 | 
						|
			return &localTableProcessor{
 | 
						|
				baseDocProcessor: *base,
 | 
						|
			}
 | 
						|
		}
 | 
						|
		return base
 | 
						|
	default:
 | 
						|
		return base
 | 
						|
	}
 | 
						|
}
 |