279 lines
9.4 KiB
Go
279 lines
9.4 KiB
Go
// Package service provides business logic implementations for WeKnora application
|
|
// This package contains service layer implementations that coordinate between
|
|
// repositories and handlers, applying business rules and transaction management
|
|
package service
|
|
|
|
import (
|
|
"context"
|
|
|
|
"knowlege-lsxd/internal/logger"
|
|
"knowlege-lsxd/internal/types"
|
|
"knowlege-lsxd/internal/types/interfaces"
|
|
)
|
|
|
|
// chunkService implements the ChunkService interface
|
|
// It provides operations for managing document chunks in the knowledge base
|
|
// Chunks are segments of documents that have been processed and prepared for indexing
|
|
type chunkService struct {
|
|
chunkRepository interfaces.ChunkRepository // Repository for chunk data persistence
|
|
kbRepository interfaces.KnowledgeBaseRepository
|
|
modelService interfaces.ModelService
|
|
}
|
|
|
|
// NewChunkService creates a new chunk service
|
|
// It initializes a service with the provided chunk repository
|
|
// Parameters:
|
|
// - chunkRepository: Repository for chunk operations
|
|
//
|
|
// Returns:
|
|
// - interfaces.ChunkService: Initialized chunk service implementation
|
|
func NewChunkService(
|
|
chunkRepository interfaces.ChunkRepository,
|
|
kbRepository interfaces.KnowledgeBaseRepository,
|
|
modelService interfaces.ModelService,
|
|
) interfaces.ChunkService {
|
|
return &chunkService{
|
|
chunkRepository: chunkRepository,
|
|
kbRepository: kbRepository,
|
|
modelService: modelService,
|
|
}
|
|
}
|
|
|
|
// CreateChunks creates multiple chunks
|
|
// This method persists a batch of document chunks to the repository
|
|
// Parameters:
|
|
// - ctx: Context with authentication and request information
|
|
// - chunks: Slice of document chunks to create
|
|
//
|
|
// Returns:
|
|
// - error: Any error encountered during chunk creation
|
|
func (s *chunkService) CreateChunks(ctx context.Context, chunks []*types.Chunk) error {
|
|
logger.Info(ctx, "Start creating chunks")
|
|
logger.Infof(ctx, "Creating %d chunks", len(chunks))
|
|
|
|
err := s.chunkRepository.CreateChunks(ctx, chunks)
|
|
if err != nil {
|
|
logger.ErrorWithFields(ctx, err, map[string]interface{}{
|
|
"chunk_count": len(chunks),
|
|
})
|
|
return err
|
|
}
|
|
|
|
logger.Info(ctx, "Chunks created successfully")
|
|
return nil
|
|
}
|
|
|
|
// GetChunkByID retrieves a chunk by its ID
|
|
// This method fetches a specific chunk using its ID and validates tenant access
|
|
// Parameters:
|
|
// - ctx: Context with authentication and request information
|
|
// - knowledgeID: ID of the knowledge document containing the chunk
|
|
// - id: ID of the chunk to retrieve
|
|
//
|
|
// Returns:
|
|
// - *types.Chunk: Retrieved chunk if found
|
|
// - error: Any error encountered during retrieval
|
|
func (s *chunkService) GetChunkByID(ctx context.Context, knowledgeID string, id string) (*types.Chunk, error) {
|
|
logger.Info(ctx, "Start getting chunk by ID")
|
|
logger.Infof(ctx, "Getting chunk, ID: %s, knowledge ID: %s", id, knowledgeID)
|
|
|
|
tenantID := ctx.Value(types.TenantIDContextKey).(uint)
|
|
logger.Infof(ctx, "Tenant ID: %d", tenantID)
|
|
|
|
chunk, err := s.chunkRepository.GetChunkByID(ctx, tenantID, id)
|
|
if err != nil {
|
|
logger.ErrorWithFields(ctx, err, map[string]interface{}{
|
|
"chunk_id": id,
|
|
"knowledge_id": knowledgeID,
|
|
"tenant_id": tenantID,
|
|
})
|
|
return nil, err
|
|
}
|
|
|
|
logger.Info(ctx, "Chunk retrieved successfully")
|
|
return chunk, nil
|
|
}
|
|
|
|
// ListChunksByKnowledgeID lists all chunks for a knowledge ID
|
|
// This method retrieves all chunks belonging to a specific knowledge document
|
|
// Parameters:
|
|
// - ctx: Context with authentication and request information
|
|
// - knowledgeID: ID of the knowledge document
|
|
//
|
|
// Returns:
|
|
// - []*types.Chunk: List of chunks belonging to the knowledge document
|
|
// - error: Any error encountered during retrieval
|
|
func (s *chunkService) ListChunksByKnowledgeID(ctx context.Context, knowledgeID string) ([]*types.Chunk, error) {
|
|
logger.Info(ctx, "Start listing chunks by knowledge ID")
|
|
logger.Infof(ctx, "Knowledge ID: %s", knowledgeID)
|
|
|
|
tenantID := ctx.Value(types.TenantIDContextKey).(uint)
|
|
logger.Infof(ctx, "Tenant ID: %d", tenantID)
|
|
|
|
chunks, err := s.chunkRepository.ListChunksByKnowledgeID(ctx, tenantID, knowledgeID)
|
|
if err != nil {
|
|
logger.ErrorWithFields(ctx, err, map[string]interface{}{
|
|
"knowledge_id": knowledgeID,
|
|
"tenant_id": tenantID,
|
|
})
|
|
return nil, err
|
|
}
|
|
|
|
logger.Infof(ctx, "Retrieved %d chunks successfully", len(chunks))
|
|
return chunks, nil
|
|
}
|
|
|
|
// ListPagedChunksByKnowledgeID lists chunks for a knowledge ID with pagination
|
|
// This method retrieves chunks with pagination support for better performance with large datasets
|
|
// Parameters:
|
|
// - ctx: Context with authentication and request information
|
|
// - knowledgeID: ID of the knowledge document
|
|
// - page: Pagination parameters including page number and page size
|
|
//
|
|
// Returns:
|
|
// - *types.PageResult: Paginated result containing chunks and pagination metadata
|
|
// - error: Any error encountered during retrieval
|
|
func (s *chunkService) ListPagedChunksByKnowledgeID(ctx context.Context,
|
|
knowledgeID string, page *types.Pagination,
|
|
) (*types.PageResult, error) {
|
|
logger.Info(ctx, "Start listing paged chunks by knowledge ID")
|
|
logger.Infof(ctx, "Knowledge ID: %s, page: %d, page size: %d", knowledgeID, page.Page, page.PageSize)
|
|
|
|
tenantID := ctx.Value(types.TenantIDContextKey).(uint)
|
|
logger.Infof(ctx, "Tenant ID: %d", tenantID)
|
|
chunkType := []types.ChunkType{types.ChunkTypeText}
|
|
chunks, total, err := s.chunkRepository.ListPagedChunksByKnowledgeID(ctx, tenantID, knowledgeID, page, chunkType)
|
|
if err != nil {
|
|
logger.ErrorWithFields(ctx, err, map[string]interface{}{
|
|
"knowledge_id": knowledgeID,
|
|
"tenant_id": tenantID,
|
|
"page": page.Page,
|
|
"page_size": page.PageSize,
|
|
})
|
|
return nil, err
|
|
}
|
|
|
|
logger.Infof(ctx, "Retrieved %d chunks out of %d total chunks", len(chunks), total)
|
|
return types.NewPageResult(total, page, chunks), nil
|
|
}
|
|
|
|
// updateChunk updates a chunk
|
|
// This method updates an existing chunk in the repository
|
|
// Parameters:
|
|
// - ctx: Context with authentication and request information
|
|
// - chunk: Chunk with updated fields
|
|
//
|
|
// Returns:
|
|
// - error: Any error encountered during update
|
|
//
|
|
// This method handles the actual update logic for a chunk, including updating the vector database representation
|
|
func (s *chunkService) UpdateChunk(ctx context.Context, chunk *types.Chunk) error {
|
|
logger.Infof(ctx, "Updating chunk, ID: %s, knowledge ID: %s", chunk.ID, chunk.KnowledgeID)
|
|
|
|
// Update the chunk in the repository
|
|
err := s.chunkRepository.UpdateChunk(ctx, chunk)
|
|
if err != nil {
|
|
logger.ErrorWithFields(ctx, err, map[string]interface{}{
|
|
"chunk_id": chunk.ID,
|
|
"knowledge_id": chunk.KnowledgeID,
|
|
})
|
|
return err
|
|
}
|
|
|
|
logger.Info(ctx, "Chunk updated successfully")
|
|
return nil
|
|
}
|
|
|
|
// DeleteChunk deletes a chunk by ID
|
|
// This method removes a specific chunk from the repository
|
|
// Parameters:
|
|
// - ctx: Context with authentication and request information
|
|
// - id: ID of the chunk to delete
|
|
//
|
|
// Returns:
|
|
// - error: Any error encountered during deletion
|
|
func (s *chunkService) DeleteChunk(ctx context.Context, id string) error {
|
|
logger.Info(ctx, "Start deleting chunk")
|
|
logger.Infof(ctx, "Deleting chunk, ID: %s", id)
|
|
|
|
tenantID := ctx.Value(types.TenantIDContextKey).(uint)
|
|
logger.Infof(ctx, "Tenant ID: %d", tenantID)
|
|
|
|
err := s.chunkRepository.DeleteChunk(ctx, tenantID, id)
|
|
if err != nil {
|
|
logger.ErrorWithFields(ctx, err, map[string]interface{}{
|
|
"chunk_id": id,
|
|
"tenant_id": tenantID,
|
|
})
|
|
return err
|
|
}
|
|
|
|
logger.Info(ctx, "Chunk deleted successfully")
|
|
return nil
|
|
}
|
|
|
|
// DeleteChunksByKnowledgeID deletes all chunks for a knowledge ID
|
|
// This method removes all chunks belonging to a specific knowledge document
|
|
// Parameters:
|
|
// - ctx: Context with authentication and request information
|
|
// - knowledgeID: ID of the knowledge document
|
|
//
|
|
// Returns:
|
|
// - error: Any error encountered during bulk deletion
|
|
func (s *chunkService) DeleteChunksByKnowledgeID(ctx context.Context, knowledgeID string) error {
|
|
logger.Info(ctx, "Start deleting all chunks by knowledge ID")
|
|
logger.Infof(ctx, "Knowledge ID: %s", knowledgeID)
|
|
|
|
tenantID := ctx.Value(types.TenantIDContextKey).(uint)
|
|
logger.Infof(ctx, "Tenant ID: %d", tenantID)
|
|
|
|
err := s.chunkRepository.DeleteChunksByKnowledgeID(ctx, tenantID, knowledgeID)
|
|
if err != nil {
|
|
logger.ErrorWithFields(ctx, err, map[string]interface{}{
|
|
"knowledge_id": knowledgeID,
|
|
"tenant_id": tenantID,
|
|
})
|
|
return err
|
|
}
|
|
|
|
logger.Info(ctx, "All chunks under knowledge deleted successfully")
|
|
return nil
|
|
}
|
|
|
|
func (s *chunkService) DeleteByKnowledgeList(ctx context.Context, ids []string) error {
|
|
logger.Info(ctx, "Start deleting all chunks by knowledge IDs")
|
|
logger.Infof(ctx, "Knowledge IDs: %v", ids)
|
|
|
|
tenantID := ctx.Value(types.TenantIDContextKey).(uint)
|
|
logger.Infof(ctx, "Tenant ID: %d", tenantID)
|
|
|
|
err := s.chunkRepository.DeleteByKnowledgeList(ctx, tenantID, ids)
|
|
if err != nil {
|
|
logger.ErrorWithFields(ctx, err, map[string]interface{}{
|
|
"knowledge_id": ids,
|
|
"tenant_id": tenantID,
|
|
})
|
|
return err
|
|
}
|
|
|
|
logger.Info(ctx, "All chunks under knowledge deleted successfully")
|
|
return nil
|
|
}
|
|
|
|
func (s *chunkService) ListChunkByParentID(ctx context.Context, tenantID uint, parentID string) ([]*types.Chunk, error) {
|
|
logger.Info(ctx, "Start listing chunk by parent ID")
|
|
logger.Infof(ctx, "Parent ID: %s", parentID)
|
|
|
|
chunks, err := s.chunkRepository.ListChunkByParentID(ctx, tenantID, parentID)
|
|
if err != nil {
|
|
logger.ErrorWithFields(ctx, err, map[string]interface{}{
|
|
"parent_id": parentID,
|
|
"tenant_id": tenantID,
|
|
})
|
|
return nil, err
|
|
}
|
|
|
|
logger.Info(ctx, "Chunk listed successfully")
|
|
return chunks, nil
|
|
}
|