feat(infra): integrate PaddleOCR's PP-StructureV3 as a document parser backend (#714)
This commit is contained in:
@@ -88,7 +88,7 @@ func TestParseXLSX(t *testing.T) {
|
||||
ChunkingStrategy: nil,
|
||||
}
|
||||
|
||||
pfn := parseXLSX(config)
|
||||
pfn := ParseXLSX(config)
|
||||
docs, err := pfn(ctx, reader, parser.WithExtraMeta(map[string]any{
|
||||
"document_id": int64(123),
|
||||
"knowledge_id": int64(456),
|
||||
@@ -159,7 +159,7 @@ func TestParseXLSXConvertColumnType(t *testing.T) {
|
||||
ChunkingStrategy: nil,
|
||||
}
|
||||
|
||||
pfn := parseXLSX(config)
|
||||
pfn := ParseXLSX(config)
|
||||
docs, err := pfn(ctx, reader, parser.WithExtraMeta(map[string]any{
|
||||
"document_id": int64(123),
|
||||
"knowledge_id": int64(456),
|
||||
|
||||
Reference in New Issue
Block a user