vella-backend / _utils /models /gerar_relatorio.py
luanpoppe
fix: adicionando opção de não utilizar o contextualized chunks temporariamente
1286e81
raw
history blame
594 Bytes
from dataclasses import dataclass, field
from typing import List, Dict, Tuple, Optional

import numpy as np
@dataclass
class DocumentChunk:
    """Plain record describing one chunk of a document.

    All five fields are required and are accepted positionally in the
    order they are declared below.
    """

    # Text of the chunk.
    content: str
    # Page the chunk belongs to (0- or 1-based is not visible here — confirm
    # against the code that builds chunks).
    page_number: int
    # Identifier for the chunk; format is decided by the producer.
    chunk_id: str
    # presumably character offsets of the chunk within its source text —
    # TODO confirm whether end_char is inclusive or exclusive.
    start_char: int
    end_char: int
@dataclass
class RetrievalConfig:
    """Tunable settings for chunking and retrieval.

    Every field has a default, so ``RetrievalConfig()`` yields a usable
    configuration and callers override only what they need.
    """

    # presumably how many chunks a retrieval step returns — confirm with
    # the retriever that consumes this config.
    num_chunks: int = 5
    # presumably the relative weights of the embedding score and the BM25
    # score when the two are combined — confirm; nothing here enforces that
    # they sum to 1.
    embedding_weight: float = 0.5
    bm25_weight: float = 0.5
    # Size of the context window; the unit is not visible in this file.
    context_window: int = 3
    # Chunking parameters; presumably measured in characters — TODO confirm.
    chunk_overlap: int = 200
    chunk_size: int = 1_000
@dataclass
class ContextualizedChunk(DocumentChunk):
    """A ``DocumentChunk`` extended with context text and retrieval data.

    Inherits every ``DocumentChunk`` field and adds three defaulted fields,
    so the extra values can be left unset when the chunk is created.

    ``embedding`` is excluded from the generated ``__eq__``. Comparing NumPy
    arrays with ``==`` produces an element-wise array whose truth value is
    ambiguous, so including the field could make ``chunk_a == chunk_b``
    raise ``ValueError`` when the chunks carried embeddings. Equality is now
    decided by the remaining fields only.
    """

    # Extra text associated with the chunk; empty string when not provided.
    context: str = ""
    # Vector attached to the chunk, or None when not set. compare=False
    # keeps ``==`` (and therefore ``in`` / ``list.index``) usable.
    embedding: Optional[np.ndarray] = field(default=None, compare=False)
    # presumably the BM25 score assigned during retrieval — confirm; None
    # when not set.
    bm25_score: Optional[float] = None