luanpoppe committed
Commit 1286e81 · 1 Parent(s): c66a7e7
fix: adding an option to temporarily not use the contextualized chunks
Browse files
- _utils/gerar_relatorio_modelo_usuario/ContextualRetriever_original.py +96 -0
- _utils/gerar_relatorio_modelo_usuario/DocumentSummarizer_simples.py +273 -0
- _utils/gerar_relatorio_modelo_usuario/EnhancedDocumentSummarizer.py +260 -0
- _utils/gerar_relatorio_modelo_usuario/contextual_retriever.py +127 -0
- _utils/gerar_relatorio_modelo_usuario/llm_calls.py +24 -0
- _utils/gerar_relatorio_modelo_usuario/prompts.py +111 -0
- _utils/models/gerar_relatorio.py +29 -0
- _utils/ragas.py +168 -0
- _utils/resumo_completo_cursor.py +56 -788
- gerar_relatorio_modelo_usuario/__init__.py +0 -0
- gerar_relatorio_modelo_usuario/admin.py +3 -0
- gerar_relatorio_modelo_usuario/apps.py +6 -0
- gerar_relatorio_modelo_usuario/migrations/__init__.py +0 -0
- gerar_relatorio_modelo_usuario/models.py +3 -0
- gerar_relatorio_modelo_usuario/serializer.py +33 -0
- gerar_relatorio_modelo_usuario/tests.py +3 -0
- gerar_relatorio_modelo_usuario/views.py +60 -0
- ragas_api/serializer.py +1 -1
- ragas_api/views.py +1 -1
- resumos/serializer.py +0 -124
- resumos/views.py +0 -170
- setup/settings.py +1 -0
- setup/urls.py +2 -2
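
The option named in the commit message surfaces below as the is_contextualized_chunk parameter of EnhancedDocumentSummarizer.create_enhanced_vector_store. A minimal sketch of how a caller might toggle it; the call site here is hypothetical, and only contextualize_all_chunks and create_enhanced_vector_store actually appear in this commit:

# Hypothetical call site; only the two methods invoked here are part of this commit.
use_contextualized_chunks = False  # temporarily skip chunk contextualization

if use_contextualized_chunks:
    chunks = summarizer.contextual_retriever.contextualize_all_chunks(pages, chunks)

vector_store, bm25, chunk_ids = summarizer.create_enhanced_vector_store(
    chunks, use_contextualized_chunks
)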
_utils/gerar_relatorio_modelo_usuario/ContextualRetriever_original.py
ADDED
@@ -0,0 +1,96 @@
from typing import List, Dict, Tuple, Optional
from anthropic import Anthropic
import logging
from _utils.models.gerar_relatorio import (
    ContextualizedChunk,
    DocumentChunk,
    RetrievalConfig,
)
from langchain.schema import Document


class ContextualRetriever:

    def __init__(
        self, config: RetrievalConfig, claude_api_key: str, claude_context_model
    ):
        self.config = config  # This self.config is currently not used for anything inside this class. Review whether it should be.
        self.claude_client = Anthropic(api_key=claude_api_key)
        self.logger = logging.getLogger(__name__)
        self.bm25 = None
        self.claude_context_model = claude_context_model

    def generate_context(self, full_text: str, chunk: DocumentChunk) -> str:
        """Generate contextual description using Claude"""
        try:
            # prompt = f"""<document>
            # {full_text}
            # </document>
            # Here is the chunk we want to situate within the whole document
            # <chunk>
            # {chunk.content}
            # </chunk>
            # Please give a short succinct context to situate this chunk within the overall document for the purposes of improving search retrieval of the chunk. Answer only with the succinct context and nothing else."""

            prompt = f"""You are a language model tasked with providing context to improve the retrieval of information from a chunk extracted from a document. Follow these steps internally (do not display reasoning or reflection in the final output):
1. **Chain of Thought (internal)**:
   - Identify the document ID, which is the value between "NUM." and "- Pág".
   - Identify the document name from the header.
2. **Reflection (internal)**:
   - Confirm the document ID and name are correctly identified.
   - Ensure the final context is concise and helpful.
3. **Final Response**:
   - Provide a short context situating the *chunk* within the document, including the document ID and document name.
   - Do not include any reasoning or reflection in your response.
**Example Usage:**
```
<document> {full_text} </document>
<chunk> {chunk.content} </chunk>
Please return only the succinct context (without displaying your internal reasoning), including the document ID and the document name.
```
"""

            response = self.claude_client.messages.create(
                model=self.claude_context_model,
                max_tokens=100,
                messages=[{"role": "user", "content": prompt}],
            )
            return response.content[
                0
            ].text  # response.content is a list because a list of messages is passed in and a list of messages is returned, the first one being the most recent, i.e. the model's answer
        except Exception as e:
            self.logger.error(
                f"Context generation failed for chunk {chunk.chunk_id}: {str(e)}"
            )
            return ""

    def contextualize_all_chunks(
        self, full_text: List[Document], chunks: List[DocumentChunk]
    ) -> List[
        ContextualizedChunk
    ]:  # Takes a chunk and only adds a context property to it, this property being the answer of the function above, which calls a Claude model to state the chunk's context
        """Add context to all chunks"""

        smaller_context = ""
        contextualized_chunks = []
        print("\n\n")
        print("len(chunks): ", len(chunks))
        for chunk in chunks:
            contador_pagina = -1
            while contador_pagina <= 1:
                local_page = full_text[chunk.page_number + contador_pagina]
                if local_page:
                    smaller_context += local_page.page_content
                contador_pagina += 1
            print("chunk.page_number: ", chunk.page_number)
            context = self.generate_context(smaller_context, chunk)
            contextualized_chunk = ContextualizedChunk(
                content=chunk.content,
                page_number=chunk.page_number,
                chunk_id=chunk.chunk_id,
                start_char=chunk.start_char,
                end_char=chunk.end_char,
                context=context,
            )
            contextualized_chunks.append(contextualized_chunk)
        return contextualized_chunks
_utils/gerar_relatorio_modelo_usuario/DocumentSummarizer_simples.py
ADDED
@@ -0,0 +1,273 @@
import os
from typing import List, Dict, Tuple, Optional
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain_community.document_loaders import PyPDFLoader
from langchain_huggingface import HuggingFaceEmbeddings
from langchain_community.vectorstores import Chroma
from langchain_community.chat_models import ChatOpenAI
from langchain.prompts import PromptTemplate
import uuid
import logging
from cohere import Client
from _utils.models.gerar_relatorio import (
    DocumentChunk,
)
from langchain.schema import Document


class DocumentSummarizer:
    def __init__(
        self,
        openai_api_key: str,
        cohere_api_key: str,
        embedding_model,
        chunk_size,
        chunk_overlap,
        num_k_rerank,
        model_cohere_rerank,
    ):
        self.openai_api_key = openai_api_key
        self.cohere_client = Client(cohere_api_key)
        self.embeddings = HuggingFaceEmbeddings(model_name=embedding_model)
        self.text_splitter = RecursiveCharacterTextSplitter(
            chunk_size=chunk_size, chunk_overlap=chunk_overlap
        )
        self.chunk_metadata = {}  # Store chunk metadata for tracing
        self.num_k_rerank = num_k_rerank
        self.model_cohere_rerank = model_cohere_rerank

    def load_and_split_document(self, pdf_path: str) -> List[DocumentChunk]:
        """Load PDF and split into chunks with metadata"""
        loader = PyPDFLoader(pdf_path)
        pages = (
            loader.load()
        )  # Produces a list of Document objects, each item corresponding to ONE FULL PAGE of the PDF.
        chunks = []
        char_count = 0

        for page in pages:
            text = page.page_content
            page_chunks = self.text_splitter.split_text(
                text
            )  # Splits the single-page Document into a list where each item is a chunk, i.e. pieces smaller than one page.

            for chunk in page_chunks:
                chunk_id = str(uuid.uuid4())
                start_char = text.find(
                    chunk
                )  # Returns the position of the chunk within the full page
                end_char = start_char + len(chunk)

                doc_chunk = DocumentChunk(  # Builds the chunk object with extra information, such as the chunk's position and id
                    content=chunk,
                    page_number=page.metadata.get("page") + 1,  # 1-based page numbering
                    chunk_id=chunk_id,
                    start_char=char_count + start_char,
                    end_char=char_count + end_char,
                )
                chunks.append(doc_chunk)

                # Store metadata for later retrieval
                self.chunk_metadata[chunk_id] = {
                    "page": doc_chunk.page_number,
                    "start_char": doc_chunk.start_char,
                    "end_char": doc_chunk.end_char,
                }

            char_count += len(text)

        return chunks

    def load_and_split_text(self, text: str) -> List[DocumentChunk]:
        """Load text and split into chunks with metadata - created this function only for ragas"""
        page = Document(page_content=text, metadata={"page": 1})
        chunks = []
        char_count = 0

        text = page.page_content
        page_chunks = self.text_splitter.split_text(
            text
        )  # Splits the single-page Document into a list where each item is a chunk, i.e. pieces smaller than one page.
        print("\n\n\n")
        print("page_chunks: ", page_chunks)

        for chunk in page_chunks:
            chunk_id = str(uuid.uuid4())
            start_char = text.find(
                chunk
            )  # Returns the position of the chunk within the full page
            end_char = start_char + len(chunk)

            doc_chunk = DocumentChunk(  # Builds the chunk object with extra information, such as the chunk's position and id
                content=chunk,
                page_number=page.metadata.get("page") + 1,  # 1-based page numbering
                chunk_id=chunk_id,
                start_char=char_count + start_char,
                end_char=char_count + end_char,
            )
            chunks.append(doc_chunk)

            # Store metadata for later retrieval
            self.chunk_metadata[chunk_id] = {
                "page": doc_chunk.page_number,
                "start_char": doc_chunk.start_char,
                "end_char": doc_chunk.end_char,
            }

        char_count += len(text)

        return chunks

    def create_vector_store(
        self, chunks: List[DocumentChunk]
    ) -> Chroma:  # This function is never used
        """Create vector store with metadata"""
        texts = [chunk.content for chunk in chunks]
        metadatas = [
            {
                "chunk_id": chunk.chunk_id,
                "page": chunk.page_number,
                "start_char": chunk.start_char,
                "end_char": chunk.end_char,
            }
            for chunk in chunks
        ]

        vector_store = Chroma.from_texts(
            texts=texts, metadatas=metadatas, embedding=self.embeddings
        )
        return vector_store

    def rerank_chunks(  # This function is never used
        self, chunks: List[Dict], query: str, k: int = 5
    ) -> List[Dict]:
        """
        Rerank chunks using Cohere's reranking model.

        Args:
            chunks: List of dictionaries containing chunks and their metadata
            query: Original search query
            k: Number of top chunks to return

        Returns:
            List of reranked chunks with updated relevance scores
        """
        try:
            # Prepare documents for reranking
            documents = [chunk["content"] for chunk in chunks]

            # Get reranking scores from Cohere
            results = self.cohere_client.rerank(
                query=query,
                documents=documents,
                top_n=k,
                model=self.model_cohere_rerank,
            )

            # Create reranked results with original metadata
            reranked_chunks = []
            for hit in results:
                original_chunk = chunks[hit.index]
                reranked_chunks.append(
                    {**original_chunk, "relevance_score": hit.relevance_score}
                )

            return reranked_chunks

        except Exception as e:
            logging.error(f"Reranking failed: {str(e)}")
            return chunks[:k]  # Fallback to original ordering

    def generate_summary_with_sources(  # This function is never used
        self,
        vector_store: Chroma,
        query: str = "Summarize the main points of this document",
    ) -> List[Dict]:
        """Generate summary with source citations using reranking"""
        # Retrieve more initial chunks for reranking
        relevant_docs = vector_store.similarity_search_with_score(query, k=20)

        # Prepare chunks for reranking
        chunks = []
        for doc, score in relevant_docs:
            chunks.append(
                {
                    "content": doc.page_content,
                    "page": doc.metadata["page"],
                    "chunk_id": doc.metadata["chunk_id"],
                    "relevance_score": score,
                }
            )

        # Rerank chunks
        reranked_chunks = self.rerank_chunks(chunks, query, k=self.num_k_rerank)

        # Prepare context and sources from reranked chunks
        contexts = []
        sources = []

        for chunk in reranked_chunks:
            contexts.append(chunk["content"])
            sources.append(
                {
                    "content": chunk["content"],
                    "page": chunk["page"],
                    "chunk_id": chunk["chunk_id"],
                    "relevance_score": chunk["relevance_score"],
                }
            )

        prompt_template = """
        Based on the following context, provide multiple key points from the document.
        For each point, create a new paragraph.
        Each paragraph should be a complete, self-contained insight.

        Context: {context}

        Key points:
        """

        prompt = PromptTemplate(template=prompt_template, input_variables=["context"])

        llm = ChatOpenAI(
            temperature=0, model_name="gpt-4o-mini", api_key=self.openai_api_key
        )

        response = llm.predict(prompt.format(context="\n\n".join(contexts)))

        # Split the response into paragraphs
        summaries = [p.strip() for p in response.split("\n\n") if p.strip()]

        # Create structured output
        structured_output = []
        for idx, summary in enumerate(summaries):
            # Associate each summary with the most relevant source
            structured_output.append(
                {
                    "content": summary,
                    "source": {
                        "page": sources[min(idx, len(sources) - 1)]["page"],
                        "text": sources[min(idx, len(sources) - 1)]["content"][:200]
                        + "...",
                        "relevance_score": sources[min(idx, len(sources) - 1)][
                            "relevance_score"
                        ],
                    },
                }
            )

        return structured_output

    def get_source_context(
        self, chunk_id: str, window: int = 100
    ) -> Dict:  # This function is never used
        """Get extended context around a specific chunk"""
        metadata = self.chunk_metadata.get(chunk_id)
        if not metadata:
            return None

        return {
            "page": metadata["page"],
            "start_char": metadata["start_char"],
            "end_char": metadata["end_char"],
        }
_utils/gerar_relatorio_modelo_usuario/EnhancedDocumentSummarizer.py
ADDED
@@ -0,0 +1,260 @@
import os
from typing import List, Dict, Tuple, Optional
from langchain_community.vectorstores import Chroma
from langchain_community.chat_models import ChatOpenAI
from langchain.chains import create_extraction_chain
from langchain.prompts import PromptTemplate
from rank_bm25 import BM25Okapi
import logging
import requests
from _utils.gerar_relatorio_modelo_usuario.DocumentSummarizer_simples import (
    DocumentSummarizer,
)
from _utils.models.gerar_relatorio import (
    ContextualizedChunk,
    RetrievalConfig,
)
from setup.environment import api_url
from rest_framework.response import Response
from _utils.gerar_relatorio_modelo_usuario.contextual_retriever import (
    ContextualRetriever,
)


class EnhancedDocumentSummarizer(DocumentSummarizer):
    def __init__(
        self,
        openai_api_key: str,
        claude_api_key: str,
        config: RetrievalConfig,
        embedding_model,
        chunk_size,
        chunk_overlap,
        num_k_rerank,
        model_cohere_rerank,
        claude_context_model,
        prompt_relatorio,
        gpt_model,
        gpt_temperature,
        id_modelo_do_usuario,
        prompt_modelo,
        reciprocal_rank_fusion,
    ):
        super().__init__(
            openai_api_key,
            os.environ.get("COHERE_API_KEY"),
            embedding_model,
            chunk_size,
            chunk_overlap,
            num_k_rerank,
            model_cohere_rerank,
        )
        self.config = config
        self.contextual_retriever = ContextualRetriever(
            config, claude_api_key, claude_context_model
        )
        self.logger = logging.getLogger(__name__)
        self.prompt_relatorio = prompt_relatorio
        self.gpt_model = gpt_model
        self.gpt_temperature = gpt_temperature
        self.id_modelo_do_usuario = id_modelo_do_usuario
        self.prompt_modelo = prompt_modelo
        self.reciprocal_rank_fusion = reciprocal_rank_fusion

    def create_enhanced_vector_store(
        self, chunks: List[ContextualizedChunk], is_contextualized_chunk
    ) -> Tuple[Chroma, BM25Okapi, List[str]]:
        """Create vector store and BM25 index with contextualized chunks"""
        try:
            # Prepare texts with context
            if is_contextualized_chunk:
                texts = [f"{chunk.context} {chunk.content}" for chunk in chunks]
            else:
                texts = [f"{chunk.content}" for chunk in chunks]

            # Create vector store
            metadatas = []
            for chunk in chunks:
                if is_contextualized_chunk:
                    context = chunk.context
                else:
                    context = ""
                metadatas.append(
                    {
                        "chunk_id": chunk.chunk_id,
                        "page": chunk.page_number,
                        "start_char": chunk.start_char,
                        "end_char": chunk.end_char,
                        "context": context,
                    }
                )

            vector_store = Chroma.from_texts(
                texts=texts, metadatas=metadatas, embedding=self.embeddings
            )

            # Create BM25 index
            tokenized_texts = [text.split() for text in texts]
            bm25 = BM25Okapi(tokenized_texts)

            # Get chunk IDs in order
            chunk_ids = [chunk.chunk_id for chunk in chunks]

            return vector_store, bm25, chunk_ids

        except Exception as e:
            self.logger.error(f"Error creating enhanced vector store: {str(e)}")
            raise

    def retrieve_with_rank_fusion(
        self, vector_store: Chroma, bm25: BM25Okapi, chunk_ids: List[str], query: str
    ) -> List[Dict]:
        """Combine embedding and BM25 retrieval results"""
        try:
            # Get embedding results
            embedding_results = vector_store.similarity_search_with_score(
                query, k=self.config.num_chunks
            )

            # Convert embedding results to list of (chunk_id, score)
            embedding_list = [
                (doc.metadata["chunk_id"], 1 / (1 + score))
                for doc, score in embedding_results
            ]

            # Get BM25 results
            tokenized_query = query.split()
            bm25_scores = bm25.get_scores(tokenized_query)

            # Convert BM25 scores to list of (chunk_id, score)
            bm25_list = [
                (chunk_ids[i], float(score)) for i, score in enumerate(bm25_scores)
            ]

            # Sort bm25_list by score in descending order and limit to top N results
            bm25_list = sorted(bm25_list, key=lambda x: x[1], reverse=True)[
                : self.config.num_chunks
            ]

            # Normalize BM25 scores
            calculo_max = max(
                [score for _, score in bm25_list]
            )  # Added this max() because the scores sometimes came back as 0 and it complained about division by zero
            max_bm25 = calculo_max if bm25_list and calculo_max else 1
            bm25_list = [(doc_id, score / max_bm25) for doc_id, score in bm25_list]

            # Pass the lists to rank fusion
            result_lists = [embedding_list, bm25_list]
            weights = [self.config.embedding_weight, self.config.bm25_weight]

            combined_results = self.reciprocal_rank_fusion(
                result_lists, weights=weights
            )

            return combined_results

        except Exception as e:
            self.logger.error(f"Error in rank fusion retrieval: {str(e)}")
            raise

    def generate_enhanced_summary(
        self,
        vector_store: Chroma,
        bm25: BM25Okapi,
        chunk_ids: List[str],
        query: str = "Summarize the main points of this document",
    ) -> List[Dict]:
        """Generate enhanced summary using both vector and BM25 retrieval"""
        try:
            # Get combined results using rank fusion
            ranked_results = self.retrieve_with_rank_fusion(
                vector_store, bm25, chunk_ids, query
            )

            # Prepare context and track sources
            contexts = []
            sources = []

            # Get full documents for top results
            for chunk_id, score in ranked_results[: self.config.num_chunks]:
                results = vector_store.get(
                    where={"chunk_id": chunk_id}, include=["documents", "metadatas"]
                )

                if results["documents"]:
                    context = results["documents"][0]
                    metadata = results["metadatas"][0]

                    contexts.append(context)
                    sources.append(
                        {
                            "content": context,
                            "page": metadata["page"],
                            "chunk_id": chunk_id,
                            "relevance_score": score,
                            "context": metadata.get("context", ""),
                        }
                    )

            url_request = f"{api_url}/modelo/{self.id_modelo_do_usuario}"
            resposta = requests.get(url_request)

            if resposta.status_code != 200:
                return Response(
                    {
                        "error": "Ocorreu um problema. Pode ser que o modelo não tenha sido encontrado. Tente novamente e/ou entre em contato com a equipe técnica"
                    }
                )

            modelo_buscado = resposta.json()["modelo"]

            llm = ChatOpenAI(
                temperature=self.gpt_temperature,
                model_name=self.gpt_model,
                api_key=self.openai_api_key,
            )

            prompt_gerar_relatorio = PromptTemplate(
                template=self.prompt_relatorio, input_variables=["context"]
            )

            relatorio_gerado = llm.predict(
                prompt_gerar_relatorio.format(context="\n\n".join(contexts))
            )

            prompt_gerar_modelo = PromptTemplate(
                template=self.prompt_modelo,
                input_variables=["context", "modelo_usuario"],
            )

            modelo_gerado = llm.predict(
                prompt_gerar_modelo.format(
                    context=relatorio_gerado, modelo_usuario=modelo_buscado
                )
            )

            # Split the response into paragraphs
            summaries = [p.strip() for p in modelo_gerado.split("\n\n") if p.strip()]

            # Create structured output
            structured_output = []
            for idx, summary in enumerate(summaries):
                source_idx = min(idx, len(sources) - 1)
                structured_output.append(
                    {
                        "content": summary,
                        "source": {
                            "page": sources[source_idx]["page"],
                            "text": sources[source_idx]["content"][:200] + "...",
                            "context": sources[source_idx]["context"],
                            "relevance_score": sources[source_idx]["relevance_score"],
                            "chunk_id": sources[source_idx]["chunk_id"],
                        },
                    }
                )

            return structured_output

        except Exception as e:
            self.logger.error(f"Error generating enhanced summary: {str(e)}")
            raise
_utils/gerar_relatorio_modelo_usuario/contextual_retriever.py
ADDED
@@ -0,0 +1,127 @@
import os
from langchain_openai import ChatOpenAI
from typing import List, Dict, Tuple, Optional
from anthropic import Anthropic
import logging
from langchain.schema import Document
import asyncio
from langchain.prompts import PromptTemplate
from typing import List
from multiprocessing import Process, Barrier, Queue
from dataclasses import dataclass
from langchain_core.messages import HumanMessage

from _utils.gerar_relatorio_modelo_usuario.llm_calls import claude_answer, gpt_answer
from _utils.gerar_relatorio_modelo_usuario.prompts import contextual_prompt
from _utils.models.gerar_relatorio import (
    ContextualizedChunk,
    DocumentChunk,
    RetrievalConfig,
)

lista_contador = []


def task(name, barrier, queue, chunk, full_text, config, claude_context_model):
    """Standalone function to process a chunk."""
    print(f"Process {name} ready")
    barrier.wait()  # Wait for all processes to be ready
    retriever = ContextualRetriever(config, None, claude_context_model)
    result = retriever.create_contextualized_chunk(chunk, full_text)
    queue.put(result)  # Store the result in the queue


class ContextualRetriever:
    def __init__(
        self, config: RetrievalConfig, claude_api_key: str, claude_context_model: str
    ):
        self.config = config
        self.claude_client = Anthropic(api_key=claude_api_key)
        self.logger = logging.getLogger(__name__)
        self.bm25 = None
        self.claude_context_model = claude_context_model

    def llm_generate_context(self, full_text: str, chunk: DocumentChunk) -> str:
        """Generate contextual description using ChatOpenAI"""
        try:
            prompt = contextual_prompt(full_text, chunk.content)
            print("COMEÇOU A REQUISIÇÃO")
            # response = claude_answer(self.claude_client, self.claude_context_model, prompt)
            response = gpt_answer(prompt)
            return response
        except Exception as e:
            self.logger.error(
                f"Context generation failed for chunk {chunk.chunk_id}: {str(e)}"
            )
            return ""

    def create_contextualized_chunk(self, chunk, full_text):
        lista_contador.append(0)
        print("contador: ", len(lista_contador))
        page_content = ""
        for i in range(
            max(0, chunk.page_number - 1),
            min(len(full_text), chunk.page_number + 2),
        ):
            page_content += full_text[i].page_content if full_text[i] else ""

        context = self.llm_generate_context(page_content, chunk)
        return ContextualizedChunk(
            content=chunk.content,
            page_number=chunk.page_number,
            chunk_id=chunk.chunk_id,
            start_char=chunk.start_char,
            end_char=chunk.end_char,
            context=context,
        )

    def contextualize_all_chunks(
        self, full_text: List[Document], chunks: List[DocumentChunk]
    ) -> List[ContextualizedChunk]:
        """Add context to all chunks"""
        contextualized_chunks = []

        # tasks = [create_contextualized_chunk(chunk) for chunk in chunks]
        # contextualized_chunks = await asyncio.gather(*tasks)

        contextualized_chunks = self.main(chunks, full_text)

        return contextualized_chunks

    # def task(self, name, barrier, queue, chunk, full_text):
    #     print(f"Process {name} ready")
    #     barrier.wait()  # Wait for all processes to be ready
    #     result = self.create_contextualized_chunk(chunk, full_text)
    #     queue.put(result)  # Store the result in the queue

    def main(self, chunks, full_text):
        barrier = Barrier(1)
        queue = Queue()
        processes = []

        for i in range(len(chunks)):
            p = Process(
                target=task,
                args=(
                    f"P{i+1}",
                    barrier,
                    queue,
                    chunks[i],
                    full_text,
                    self.config,
                    self.claude_context_model,
                ),
            )
            processes.append(p)
            p.start()

        results = []
        for p in processes:
            p.join()

        # Collect results from the queue
        while not queue.empty():
            print("queue.get(): ", queue.get())
            results.append(queue.get())

        return results
_utils/gerar_relatorio_modelo_usuario/llm_calls.py
ADDED
@@ -0,0 +1,24 @@
import os
from langchain_core.messages import HumanMessage
from langchain_openai import ChatOpenAI


def claude_answer(claude_client, claude_context_model, prompt):
    response = claude_client.messages.create(
        model=claude_context_model,
        max_tokens=100,
        messages=[{"role": "user", "content": prompt}],
    )
    return response.content[
        0
    ].text  # response.content is a list because a list of messages is passed in and a list of messages is returned, the first one being the most recent, i.e. the model's answer


def gpt_answer(prompt):
    gpt = ChatOpenAI(
        temperature=0,
        model="gpt-4o-mini",
        api_key=os.environ.get("OPENAI_API_KEY"),
    )
    response = gpt.invoke([HumanMessage(content=prompt)])
    return response.content
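
A short usage sketch for the helpers above (hypothetical call site; gpt_answer reads OPENAI_API_KEY from the environment, so it is assumed to be set, and the prompt text below is a placeholder since the real prompt in this commit comes from prompts.contextual_prompt):

from _utils.gerar_relatorio_modelo_usuario.llm_calls import gpt_answer

# Placeholder prompt for illustration only.
context_sentence = gpt_answer("Situate this chunk within the overall document: ...")
print(context_sentence)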
_utils/gerar_relatorio_modelo_usuario/prompts.py
ADDED
@@ -0,0 +1,111 @@
def contextual_prompt(full_text, chunk_content):
    return f"""You are a language model tasked with providing context to improve the retrieval of information from a chunk extracted from a document. Follow these steps internally (do not display reasoning or reflection in the final output):
1. **Chain of Thought (internal)**:
   - Identify the document ID, which is the value between "NUM." and "- Pág".
   - Identify the document name from the header.
2. **Reflection (internal)**:
   - Confirm the document ID and name are correctly identified.
   - Ensure the final context is concise and helpful.
3. **Final Response**:
   - Provide a short context situating the *chunk* within the document, including the document ID and document name.
   - Do not include any reasoning or reflection in your response.
**Example Usage:**
```
<document> {full_text} </document>
<chunk> {chunk_content} </chunk>
Please return only the succinct context (without displaying your internal reasoning), including the document ID and the document name.
```
"""


# system_prompt_modelo = """
# Based on the following context, provide multiple key points from the document.
# For each point, create a new paragraph.
# Each paragraph should be a complete, self-contained insight.
# Include any relevant context provided.

# Context: {context}

# Modelo do usuário: {modelo_usuario}

# Key points:
# """
system_prompt_modelo = """
You are a large language model that must produce a single final sentence in **Portuguese**. To do this, you will follow a private chain of thought and then produce a final answer. The final answer must follow the formatting and stylistic conventions shown in the user-provided model `user's template`. The information to be included in the final sentence is derived from the `context` (a report describing a legal case).
**Contextual Information (provided separately):**
{context}
**User Model (provided separately):**
{modelo_usuario}
**Instructions:**
1. **Goal:** Produce one single final sentence in Portuguese that matches the structure, format, and style given by `user's template`.
2. **Chain of Thought (private to the assistant and not to be shown in the final answer):**
   - Carefully review the `context` which is a legal report of a case.
   - Identify:
     - The defendant's name.
     - The crime's name, its article, and any subsection (inciso).
     - The date of receipt of the complaint (data do recebimento da denúncia).
     - The document ID.
   - Ensure these elements are correctly incorporated into the final sentence.
   - Check compliance with the formatting style indicated by `user's template`.
   - Compose the sentence following the structure from the user model.
   - Use reflection: Before finalizing the answer, reassess if all required information is included, if the format matches the user model, and if the sentence is written correctly in Portuguese.
3. **Reflection Technique (private):**
   After composing the sentence, but before presenting it as the final answer, reflect if:
   - All required details from the `context` are accurately included.
   - The sentence format strictly matches the pattern of `user's template`.
   - The sentence is grammatically correct in Portuguese.
4. **Final Answer:**
   - After completing the chain of thought and ensuring correctness through reflection, present only the final sentence in Portuguese.
   - Do not show the chain of thought or the reflection step. Only the final formatted sentence should be visible to the user.
"""

# system_prompt_relatorio = """
# Based on the following context, provide multiple key points from the document.
# For each point, create a new paragraph.
# Each paragraph should be a complete, self-contained insight.
# Include any relevant context provided.

# Context: {context}

# Key points:
# """
system_prompt_relatorio = """
You are a language model specialized in producing concise and well-structured legal case summaries in Portuguese. You will receive a variable `context`, which contains information about a legal case. Your task is to read the `context` carefully and produce a summary report in Portuguese, following the specific format provided below. Do not include any additional comments or reasoning steps in your final answer.
**Instructions**:
1. **Chain of Thought**: Before producing your final answer, you must think through and plan your summary silently, without showing this reasoning in the final output. The final answer must only contain the required formatted report and nothing else.
2. **Reading the Context**: Extract the following information from `context`:
   - The name of the defendant (réu).
   - The crime they have been accused of (nome_do_crime).
   - The applicable article and subsection of the Penal Code (artigo_e_inciso_do_crime).
   - The date the accusation was accepted (data_do_recebimento).
   - The ID of the decision document (id_do_documento).
3. **Prescriptive Details**: If no other interruptive or suspensive causes of prescription are mentioned, confirm that there are none.
4. **Formatting**: Your final answer must strictly follow the format below, in Portuguese, and replace the placeholders with the appropriate information:
```
<formato>
Trata-se de Ação Penal em que o Ministério Público denunciou [nome_do_reu], pela prática do [nome_do_crime] [artigo_e_inciso_do_crime], do Código Penal.
A denúncia foi recebida em [data_do_recebimento], conforme Decisão [id_do_documento].
Não há outras causas interruptivas ou suspensivas da prescrição.
</formato>
```
5. **Completeness**: If any piece of required information is missing in the `context`, note that explicitly in the final answer within the format.
**Reminder**:
- Do not include your chain of thought in the final output.
- Do not add extra information or commentary beyond the specified format.
- The final answer must be in Portuguese.
---

**Contextual Information (provided separately):**
{context}
---
**Example with a given context**:
- Input:
  `context` = "Em 10/03/2021, o Ministério Público denunciou João da Silva, imputando-lhe o crime de furto qualificado, previsto no art. 155, §4º, inciso II, do Código Penal. A denúncia foi recebida em 12/03/2021, conforme Decisão nº 20210312-01. Não há menção a qualquer causa interruptiva ou suspensiva da prescrição."
- Expected final answer:
```
<formato>
Trata-se de Ação Penal em que o Ministério Público denunciou João da Silva, pela prática do furto qualificado (art. 155, §4º, inciso II do Código Penal).
A denúncia foi recebida em 12/03/2021, conforme Decisão 20210312-01.
Não há outras causas interruptivas ou suspensivas da prescrição.
</formato>
"""
_utils/models/gerar_relatorio.py
ADDED
@@ -0,0 +1,29 @@
from typing import List, Dict, Tuple, Optional
from dataclasses import dataclass
import numpy as np


@dataclass
class DocumentChunk:
    content: str
    page_number: int
    chunk_id: str
    start_char: int
    end_char: int


@dataclass
class RetrievalConfig:
    num_chunks: int = 5
    embedding_weight: float = 0.5
    bm25_weight: float = 0.5
    context_window: int = 3
    chunk_overlap: int = 200
    chunk_size: int = 1000


@dataclass
class ContextualizedChunk(DocumentChunk):
    context: str = ""
    embedding: Optional[np.ndarray] = None
    bm25_score: Optional[float] = None
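
A brief, hypothetical instantiation of these dataclasses (all values are illustrative and not taken from the commit):

config = RetrievalConfig(num_chunks=8, embedding_weight=0.6, bm25_weight=0.4)
chunk = DocumentChunk(
    content="chunk text...",
    page_number=1,
    chunk_id="c1",
    start_char=0,
    end_char=120,
)
contextualized = ContextualizedChunk(
    **vars(chunk), context="short description of where this chunk sits in the document"
)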
_utils/ragas.py
ADDED
@@ -0,0 +1,168 @@
import os
from langchain_community.document_loaders import PyPDFLoader
from _utils.resumo_completo_cursor import EnhancedDocumentSummarizer, RetrievalConfig
from rest_framework.response import Response
from ragas import evaluate

from langchain.chains import SequentialChain
from langchain.prompts import PromptTemplate

# from langchain.schema import ChainResult
from langchain.memory import SimpleMemory


def test_ragas(serializer, listaPDFs):

    # Step 2: Setup RetrievalConfig and EnhancedDocumentSummarizer
    config = RetrievalConfig(
        num_chunks=serializer["num_chunks_retrieval"],
        embedding_weight=serializer["embedding_weight"],
        bm25_weight=serializer["bm25_weight"],
        context_window=serializer["context_window"],
        chunk_overlap=serializer["chunk_overlap"],
    )

    summarizer = EnhancedDocumentSummarizer(
        openai_api_key=os.environ.get("OPENAI_API_KEY"),
        claude_api_key=os.environ.get("CLAUDE_API_KEY"),
        config=config,
        embedding_model=serializer["hf_embedding"],
        chunk_overlap=serializer["chunk_overlap"],
        chunk_size=serializer["chunk_size"],
        num_k_rerank=serializer["num_k_rerank"],
        model_cohere_rerank=serializer["model_cohere_rerank"],
        claude_context_model=serializer["claude_context_model"],
        prompt_relatorio=serializer["prompt_relatorio"],
        gpt_model=serializer["model"],
        gpt_temperature=serializer["gpt_temperature"],
        id_modelo_do_usuario=serializer["id_modelo_do_usuario"],
        prompt_modelo=serializer["prompt_modelo"],
    )

    # Step 1: Define the components
    def load_and_split_documents(pdf_list, summarizer):
        """Loads and splits PDF documents into chunks."""
        all_chunks = []
        for pdf_path in pdf_list:
            chunks = summarizer.load_and_split_document(pdf_path)
            all_chunks.extend(chunks)
        return {"chunks": all_chunks}

    def get_full_text_from_pdfs(pdf_list):
        """Gets the full text from PDFs for contextualization."""
        full_text = []
        for pdf_path in pdf_list:
            loader = PyPDFLoader(pdf_path)
            pages = loader.load()
            text = " ".join([page.page_content for page in pages])
            full_text.append(text)
        return {"full_text": " ".join(full_text)}

    def contextualize_all_chunks(full_text, chunks, contextual_retriever):
        """Adds context to chunks using Claude."""
        contextualized_chunks = contextual_retriever.contextualize_all_chunks(
            full_text, chunks
        )
        return {"contextualized_chunks": contextualized_chunks}

    def create_vector_store(contextualized_chunks, summarizer):
        """Creates an enhanced vector store and BM25 index."""
        vector_store, bm25, chunk_ids = summarizer.create_enhanced_vector_store(
            contextualized_chunks
        )
        return {"vector_store": vector_store, "bm25": bm25, "chunk_ids": chunk_ids}

    def generate_summary(vector_store, bm25, chunk_ids, query, summarizer):
        """Generates an enhanced summary using the vector store and BM25 index."""
        structured_summaries = summarizer.generate_enhanced_summary(
            vector_store, bm25, chunk_ids, query
        )
        return {"structured_summaries": structured_summaries}

    # Step 3: Define Sequential Chain
    chain = SequentialChain(
        chains=[
            lambda inputs: load_and_split_documents(inputs["pdf_list"], summarizer),
            lambda inputs: get_full_text_from_pdfs(inputs["pdf_list"]),
            lambda inputs: contextualize_all_chunks(
                inputs["full_text"], inputs["chunks"], summarizer.contextual_retriever
            ),
            lambda inputs: create_vector_store(
                inputs["contextualized_chunks"], summarizer
            ),
            lambda inputs: generate_summary(
                inputs["vector_store"],
                inputs["bm25"],
                inputs["chunk_ids"],
                inputs["user_message"],
                summarizer,
            ),
        ],
        input_variables=["pdf_list", "user_message"],
        output_variables=["structured_summaries"],
    )

    from ragas.langchain.evalchain import RagasEvaluatorChain
    from ragas.metrics import (
        LLMContextRecall,
        Faithfulness,
        FactualCorrectness,
        SemanticSimilarity,
    )
    from ragas import evaluate
    from ragas.llms import LangchainLLMWrapper

    # from ragas.embeddings import LangchainEmbeddingsWrapper
    # evaluator_llm = LangchainLLMWrapper(ChatOpenAI(model="gpt-4o-mini"))
    evaluator_llm = LangchainLLMWrapper(chain)
    # evaluator_embeddings = LangchainEmbeddingsWrapper(OpenAIEmbeddings())
    from datasets import load_dataset

    dataset = load_dataset(
        "explodinggradients/amnesty_qa", "english_v3", trust_remote_code=True
    )

    from ragas import EvaluationDataset

    eval_dataset = EvaluationDataset.from_hf_dataset(dataset["eval"])

    metrics = [
        LLMContextRecall(llm=evaluator_llm),
        FactualCorrectness(llm=evaluator_llm),
        Faithfulness(llm=evaluator_llm),
        # SemanticSimilarity(embeddings=evaluator_embeddings)
    ]
    results = evaluate(dataset=eval_dataset, metrics=metrics)
    print("results: ", results)

    # Step 4: Run the Chain
    inputs = {
        "pdf_list": listaPDFs,
        "user_message": serializer["user_message"],
    }
    # result = chain.run(inputs)
    return Response({"msg": results})

    # Step 5: Format the Output
    # return {
    #     "resultado": result["structured_summaries"],
    #     "parametros-utilizados": {
    #         "num_chunks_retrieval": serializer["num_chunks_retrieval"],
    #         "embedding_weight": serializer["embedding_weight"],
    #         "bm25_weight": serializer["bm25_weight"],
    #         "context_window": serializer["context_window"],
    #         "chunk_overlap": serializer["chunk_overlap"],
    #         "num_k_rerank": serializer["num_k_rerank"],
    #         "model_cohere_rerank": serializer["model_cohere_rerank"],
    #         "more_initial_chunks_for_reranking": serializer["more_initial_chunks_for_reranking"],
    #         "claude_context_model": serializer["claude_context_model"],
    #         "gpt_temperature": serializer["gpt_temperature"],
    #         "user_message": serializer["user_message"],
    #         "model": serializer["model"],
    #         "hf_embedding": serializer["hf_embedding"],
    #         "chunk_size": serializer["chunk_size"],
    #         "chunk_overlap": serializer["chunk_overlap"],
    #         "prompt_relatorio": serializer["prompt_relatorio"],
    #         "prompt_modelo": serializer["prompt_modelo"],
    #     },
    # }
_utils/resumo_completo_cursor.py
CHANGED
@@ -1,26 +1,13 @@
 import os
-from typing import List, Dict, Tuple, Optional
-from langchain.text_splitter import RecursiveCharacterTextSplitter
 from langchain_community.document_loaders import PyPDFLoader
-from langchain_huggingface import HuggingFaceEmbeddings
-from langchain_community.vectorstores import Chroma
-from langchain_community.chat_models import ChatOpenAI
-from langchain.chains import create_extraction_chain
-from langchain.prompts import PromptTemplate
-from dataclasses import dataclass
-import uuid
 import json
-from
-
-
-import
-
-
-from setup.environment import api_url
-from rest_framework.response import Response
-from langchain.schema import Document

-listaContador = []

 def reciprocal_rank_fusion(result_lists, weights=None):
     """Combine multiple ranked lists using reciprocal rank fusion"""
@@ -47,603 +34,6 @@ os.environ.get("LANGCHAIN_API_KEY")
 os.environ["LANGCHAIN_PROJECT"] = "VELLA"


-@dataclass
-class DocumentChunk:
-    content: str
-    page_number: int
-    chunk_id: str
-    start_char: int
-    end_char: int
-
-
-@dataclass
-class RetrievalConfig:
-    num_chunks: int = 5
-    embedding_weight: float = 0.5
-    bm25_weight: float = 0.5
-    context_window: int = 3
-    chunk_overlap: int = 200
-    chunk_size: int = 1000
-
-
-@dataclass
-class ContextualizedChunk(DocumentChunk):
-    context: str = ""
-    embedding: Optional[np.ndarray] = None
-    bm25_score: Optional[float] = None
-
-
-class DocumentSummarizer:
-
-    def __init__(
-        self,
-        openai_api_key: str,
-        cohere_api_key: str,
-        embedding_model,
-        chunk_size,
-        chunk_overlap,
-        num_k_rerank,
-        model_cohere_rerank,
-    ):
-        self.openai_api_key = openai_api_key
-        self.cohere_client = Client(cohere_api_key)
-        self.embeddings = HuggingFaceEmbeddings(model_name=embedding_model)
-        self.text_splitter = RecursiveCharacterTextSplitter(
-            chunk_size=chunk_size, chunk_overlap=chunk_overlap
-        )
-        self.chunk_metadata = {}  # Store chunk metadata for tracing
-        self.num_k_rerank = num_k_rerank
-        self.model_cohere_rerank = model_cohere_rerank
-
-    def load_and_split_document(self, pdf_path: str) -> List[DocumentChunk]:
-        """Load PDF and split into chunks with metadata"""
-        loader = PyPDFLoader(pdf_path)
-        pages = (
-            loader.load()
-        )  # Produces a list of Document objects, each item corresponding to ONE FULL PAGE of the PDF.
-        chunks = []
-        char_count = 0
-
-        for page in pages:
-            text = page.page_content
-            page_chunks = self.text_splitter.split_text(
-                text
-            )  # Splits the single-page Document into a list where each item is a chunk, i.e. pieces smaller than one page.
-
-            for chunk in page_chunks:
-                chunk_id = str(uuid.uuid4())
-                start_char = text.find(
-                    chunk
-                )  # Returns the position of the chunk within the full page
-                end_char = start_char + len(chunk)
-
-                doc_chunk = DocumentChunk(  # Builds the chunk object with extra information, such as the chunk's position and id
-                    content=chunk,
-                    page_number=page.metadata.get("page") + 1,  # 1-based page numbering
-                    chunk_id=chunk_id,
-                    start_char=char_count + start_char,
-                    end_char=char_count + end_char,
-                )
-                chunks.append(doc_chunk)
-
-                # Store metadata for later retrieval
-                self.chunk_metadata[chunk_id] = {
-                    "page": doc_chunk.page_number,
-                    "start_char": doc_chunk.start_char,
-                    "end_char": doc_chunk.end_char,
-                }
-
-            char_count += len(text)
-
-        return chunks
-
-    def load_and_split_text(self, text: str) -> List[DocumentChunk]:
-        """Load text and split into chunks with metadata - created this function only for ragas"""
-        page = Document(page_content=text, metadata={"page": 1})
-        chunks = []
-        char_count = 0
-
-        text = page.page_content
-        page_chunks = self.text_splitter.split_text(
-            text
-        )  # Splits the single-page Document into a list where each item is a chunk, i.e. pieces smaller than one page.
-        print("\n\n\n")
-        print("page_chunks: ", page_chunks)
-
-        for chunk in page_chunks:
-            chunk_id = str(uuid.uuid4())
-            start_char = text.find(
-                chunk
-            )  # Returns the position of the chunk within the full page
-            end_char = start_char + len(chunk)
-
-            doc_chunk = DocumentChunk(  # Builds the chunk object with extra information, such as the chunk's position and id
-                content=chunk,
-                page_number=page.metadata.get("page") + 1,  # 1-based page numbering
-                chunk_id=chunk_id,
-                start_char=char_count + start_char,
-                end_char=char_count + end_char,
-            )
-            chunks.append(doc_chunk)
-
-            # Store metadata for later retrieval
-            self.chunk_metadata[chunk_id] = {
-                "page": doc_chunk.page_number,
-                "start_char": doc_chunk.start_char,
-                "end_char": doc_chunk.end_char,
-            }
-
-        char_count += len(text)
-
-        return chunks
-
-    def create_vector_store(
-        self, chunks: List[DocumentChunk]
-    ) -> Chroma:  # This function is never used
-        """Create vector store with metadata"""
-        texts = [chunk.content for chunk in chunks]
-        metadatas = [
-            {
-                "chunk_id": chunk.chunk_id,
-                "page": chunk.page_number,
-                "start_char": chunk.start_char,
-                "end_char": chunk.end_char,
-            }
-            for chunk in chunks
-        ]
-
-        vector_store = Chroma.from_texts(
-            texts=texts, metadatas=metadatas, embedding=self.embeddings
-        )
-        return vector_store
-
-    def rerank_chunks(  # This function is never used
-        self, chunks: List[Dict], query: str, k: int = 5
-    ) -> List[Dict]:
-        """
-        Rerank chunks using Cohere's reranking model.
-
-        Args:
-            chunks: List of dictionaries containing chunks and their metadata
-            query: Original search query
-            k: Number of top chunks to return
-
-        Returns:
-            List of reranked chunks with updated relevance scores
-        """
-        try:
-            # Prepare documents for reranking
-            documents = [chunk["content"] for chunk in chunks]
-
-            # Get reranking scores from Cohere
-            results = self.cohere_client.rerank(
-                query=query,
-                documents=documents,
-                top_n=k,
-                model=self.model_cohere_rerank,
-            )
-
-            # Create reranked results with original metadata
-            reranked_chunks = []
-            for hit in results:
-                original_chunk = chunks[hit.index]
-                reranked_chunks.append(
-                    {**original_chunk, "relevance_score": hit.relevance_score}
-                )
-
-            return reranked_chunks
-
-        except Exception as e:
-            logging.error(f"Reranking failed: {str(e)}")
-            return chunks[:k]  # Fallback to original ordering
-
-    def generate_summary_with_sources(  # This function is never used
-        self,
-        vector_store: Chroma,
-        query: str = "Summarize the main points of this document",
-    ) -> List[Dict]:
-        """Generate summary with source citations using reranking"""
-        # Retrieve more initial chunks for reranking
-        relevant_docs = vector_store.similarity_search_with_score(query, k=20)
-
-        # Prepare chunks for reranking
-        chunks = []
-        for doc, score in relevant_docs:
-            chunks.append(
-                {
-                    "content": doc.page_content,
-                    "page": doc.metadata["page"],
-                    "chunk_id": doc.metadata["chunk_id"],
-                    "relevance_score": score,
-                }
-            )
-
-        # Rerank chunks
-        reranked_chunks = self.rerank_chunks(chunks, query, k=self.num_k_rerank)
-
-        # Prepare context and sources from reranked chunks
-        contexts = []
-        sources = []
-
-        for chunk in reranked_chunks:
-            contexts.append(chunk["content"])
-            sources.append(
-                {
-                    "content": chunk["content"],
-                    "page": chunk["page"],
-                    "chunk_id": chunk["chunk_id"],
-                    "relevance_score": chunk["relevance_score"],
-                }
-            )
-
-        prompt_template = """
-        Based on the following context, provide multiple key points from the document.
-
For each point, create a new paragraph.
|
282 |
-
Each paragraph should be a complete, self-contained insight.
|
283 |
-
|
284 |
-
Context: {context}
|
285 |
-
|
286 |
-
Key points:
|
287 |
-
"""
|
288 |
-
|
289 |
-
prompt = PromptTemplate(template=prompt_template, input_variables=["context"])
|
290 |
-
|
291 |
-
llm = ChatOpenAI(
|
292 |
-
temperature=0, model_name="gpt-4o-mini", api_key=self.openai_api_key
|
293 |
-
)
|
294 |
-
|
295 |
-
response = llm.predict(prompt.format(context="\n\n".join(contexts)))
|
296 |
-
|
297 |
-
# Split the response into paragraphs
|
298 |
-
summaries = [p.strip() for p in response.split("\n\n") if p.strip()]
|
299 |
-
|
300 |
-
# Create structured output
|
301 |
-
structured_output = []
|
302 |
-
for idx, summary in enumerate(summaries):
|
303 |
-
# Associate each summary with the most relevant source
|
304 |
-
structured_output.append(
|
305 |
-
{
|
306 |
-
"content": summary,
|
307 |
-
"source": {
|
308 |
-
"page": sources[min(idx, len(sources) - 1)]["page"],
|
309 |
-
"text": sources[min(idx, len(sources) - 1)]["content"][:200]
|
310 |
-
+ "...",
|
311 |
-
"relevance_score": sources[min(idx, len(sources) - 1)][
|
312 |
-
"relevance_score"
|
313 |
-
],
|
314 |
-
},
|
315 |
-
}
|
316 |
-
)
|
317 |
-
|
318 |
-
return structured_output
|
319 |
-
|
320 |
-
def get_source_context(
|
321 |
-
self, chunk_id: str, window: int = 100
|
322 |
-
) -> Dict: # Esta função nunca está sendo utilizada
|
323 |
-
"""Get extended context around a specific chunk"""
|
324 |
-
metadata = self.chunk_metadata.get(chunk_id)
|
325 |
-
if not metadata:
|
326 |
-
return None
|
327 |
-
|
328 |
-
return {
|
329 |
-
"page": metadata["page"],
|
330 |
-
"start_char": metadata["start_char"],
|
331 |
-
"end_char": metadata["end_char"],
|
332 |
-
}
|
333 |
-
|
334 |
-
|
335 |
-
class ContextualRetriever:
|
336 |
-
|
337 |
-
def __init__(
|
338 |
-
self, config: RetrievalConfig, claude_api_key: str, claude_context_model
|
339 |
-
):
|
340 |
-
self.config = config # Este self.config no momento não está sendo utilizada para nada dentro desta classe. Analisar se deveria estar sendo utilizada.
|
341 |
-
self.claude_client = Anthropic(api_key=claude_api_key)
|
342 |
-
self.logger = logging.getLogger(__name__)
|
343 |
-
self.bm25 = None
|
344 |
-
self.claude_context_model = claude_context_model
|
345 |
-
|
346 |
-
def generate_context(self, full_text: str, chunk: DocumentChunk) -> str:
|
347 |
-
"""Generate contextual description using Claude"""
|
348 |
-
try:
|
349 |
-
# prompt = f"""<document>
|
350 |
-
# {full_text}
|
351 |
-
# </document>
|
352 |
-
# Here is the chunk we want to situate within the whole document
|
353 |
-
# <chunk>
|
354 |
-
# {chunk.content}
|
355 |
-
# </chunk>
|
356 |
-
# Please give a short succinct context to situate this chunk within the overall document for the purposes of improving search retrieval of the chunk. Answer only with the succinct context and nothing else."""
|
357 |
-
|
358 |
-
prompt = f"""You are a language model tasked with providing context to improve the retrieval of information from a chunk extracted from a document. Follow these steps internally (do not display reasoning or reflection in the final output):
|
359 |
-
1. **Chain of Thought (internal)**:
|
360 |
-
- Identify the document ID, which is the value between "NUM." and "- Pág".
|
361 |
-
- Identify the document name from the header.
|
362 |
-
2. **Reflection (internal)**:
|
363 |
-
- Confirm the document ID and name are correctly identified.
|
364 |
-
- Ensure the final context is concise and helpful.
|
365 |
-
3. **Final Response**:
|
366 |
-
- Provide a short context situating the *chunk* within the document, including the document ID and document name.
|
367 |
-
- Do not include any reasoning or reflection in your response.
|
368 |
-
**Example Usage:**
|
369 |
-
```
|
370 |
-
<document> {full_text} </document>
|
371 |
-
<chunk> {chunk.content} </chunk>
|
372 |
-
Please return only the succinct context (without displaying your internal reasoning), including the document ID and the document name.
|
373 |
-
```
|
374 |
-
"""
|
375 |
-
|
376 |
-
response = self.claude_client.messages.create(
|
377 |
-
model=self.claude_context_model,
|
378 |
-
max_tokens=100,
|
379 |
-
messages=[{"role": "user", "content": prompt}],
|
380 |
-
)
|
381 |
-
return response.content[
|
382 |
-
0
|
383 |
-
].text # O response.content é uma lista pois é passada uma lista de mensagens, e também retornado uma lista de mensagens, sendo a primeira a mais recente, que é a resposta do model
|
384 |
-
except Exception as e:
|
385 |
-
self.logger.error(
|
386 |
-
f"Context generation failed for chunk {chunk.chunk_id}: {str(e)}"
|
387 |
-
)
|
388 |
-
return ""
|
389 |
-
|
390 |
-
def contextualize_chunks(
|
391 |
-
self, full_text: List[Document], chunks: List[DocumentChunk]
|
392 |
-
) -> List[
|
393 |
-
ContextualizedChunk
|
394 |
-
]: # Pega um chunk e apenas adiciona uma propriedade de contexto a ela, sendo esta propriedade a resposta da função acima, que chama um Model do Claude para dizer o contexto de um chunk
|
395 |
-
"""Add context to all chunks"""
|
396 |
-
|
397 |
-
smaller_context = ""
|
398 |
-
contextualized_chunks = []
|
399 |
-
print("\n\n")
|
400 |
-
print("len(chunks): ", len(chunks))
|
401 |
-
for chunk in chunks:
|
402 |
-
contador_pagina = -1
|
403 |
-
while contador_pagina <= 1:
|
404 |
-
local_page = full_text[chunk.page_number + contador_pagina]
|
405 |
-
if local_page:
|
406 |
-
smaller_context += local_page.page_content
|
407 |
-
contador_pagina += 1
|
408 |
-
print("chunk.page_number: ", chunk.page_number)
|
409 |
-
context = self.generate_context(smaller_context, chunk)
|
410 |
-
contextualized_chunk = ContextualizedChunk(
|
411 |
-
content=chunk.content,
|
412 |
-
page_number=chunk.page_number,
|
413 |
-
chunk_id=chunk.chunk_id,
|
414 |
-
start_char=chunk.start_char,
|
415 |
-
end_char=chunk.end_char,
|
416 |
-
context=context,
|
417 |
-
)
|
418 |
-
contextualized_chunks.append(contextualized_chunk)
|
419 |
-
return contextualized_chunks
|
420 |
-
|
421 |
-
|
422 |
-
class EnhancedDocumentSummarizer(DocumentSummarizer):
|
423 |
-
|
424 |
-
def __init__(
|
425 |
-
self,
|
426 |
-
openai_api_key: str,
|
427 |
-
claude_api_key: str,
|
428 |
-
config: RetrievalConfig,
|
429 |
-
embedding_model,
|
430 |
-
chunk_size,
|
431 |
-
chunk_overlap,
|
432 |
-
num_k_rerank,
|
433 |
-
model_cohere_rerank,
|
434 |
-
claude_context_model,
|
435 |
-
prompt_relatorio,
|
436 |
-
gpt_model,
|
437 |
-
gpt_temperature,
|
438 |
-
id_modelo_do_usuario,
|
439 |
-
prompt_modelo,
|
440 |
-
):
|
441 |
-
super().__init__(
|
442 |
-
openai_api_key,
|
443 |
-
os.environ.get("COHERE_API_KEY"),
|
444 |
-
embedding_model,
|
445 |
-
chunk_size,
|
446 |
-
chunk_overlap,
|
447 |
-
num_k_rerank,
|
448 |
-
model_cohere_rerank,
|
449 |
-
)
|
450 |
-
self.config = config
|
451 |
-
self.contextual_retriever = ContextualRetriever(
|
452 |
-
config, claude_api_key, claude_context_model
|
453 |
-
)
|
454 |
-
self.logger = logging.getLogger(__name__)
|
455 |
-
self.prompt_relatorio = prompt_relatorio
|
456 |
-
self.gpt_model = gpt_model
|
457 |
-
self.gpt_temperature = gpt_temperature
|
458 |
-
self.id_modelo_do_usuario = id_modelo_do_usuario
|
459 |
-
self.prompt_modelo = prompt_modelo
|
460 |
-
|
461 |
-
def create_enhanced_vector_store(
|
462 |
-
self, chunks: List[ContextualizedChunk]
|
463 |
-
) -> Tuple[Chroma, BM25Okapi, List[str]]:
|
464 |
-
"""Create vector store and BM25 index with contextualized chunks"""
|
465 |
-
try:
|
466 |
-
# Prepare texts with context
|
467 |
-
texts = [f"{chunk.context} {chunk.content}" for chunk in chunks]
|
468 |
-
|
469 |
-
# Create vector store
|
470 |
-
metadatas = [
|
471 |
-
{
|
472 |
-
"chunk_id": chunk.chunk_id,
|
473 |
-
"page": chunk.page_number,
|
474 |
-
"start_char": chunk.start_char,
|
475 |
-
"end_char": chunk.end_char,
|
476 |
-
"context": chunk.context,
|
477 |
-
}
|
478 |
-
for chunk in chunks
|
479 |
-
]
|
480 |
-
|
481 |
-
vector_store = Chroma.from_texts(
|
482 |
-
texts=texts, metadatas=metadatas, embedding=self.embeddings
|
483 |
-
)
|
484 |
-
|
485 |
-
# Create BM25 index
|
486 |
-
tokenized_texts = [text.split() for text in texts]
|
487 |
-
bm25 = BM25Okapi(tokenized_texts)
|
488 |
-
|
489 |
-
# Get chunk IDs in order
|
490 |
-
chunk_ids = [chunk.chunk_id for chunk in chunks]
|
491 |
-
|
492 |
-
return vector_store, bm25, chunk_ids
|
493 |
-
|
494 |
-
except Exception as e:
|
495 |
-
self.logger.error(f"Error creating enhanced vector store: {str(e)}")
|
496 |
-
raise
|
497 |
-
|
498 |
-
def retrieve_with_rank_fusion(
|
499 |
-
self, vector_store: Chroma, bm25: BM25Okapi, chunk_ids: List[str], query: str
|
500 |
-
) -> List[Dict]:
|
501 |
-
"""Combine embedding and BM25 retrieval results"""
|
502 |
-
try:
|
503 |
-
# Get embedding results
|
504 |
-
embedding_results = vector_store.similarity_search_with_score(
|
505 |
-
query, k=self.config.num_chunks
|
506 |
-
)
|
507 |
-
|
508 |
-
# Convert embedding results to list of (chunk_id, score)
|
509 |
-
embedding_list = [
|
510 |
-
(doc.metadata["chunk_id"], 1 / (1 + score))
|
511 |
-
for doc, score in embedding_results
|
512 |
-
]
|
513 |
-
|
514 |
-
# Get BM25 results
|
515 |
-
tokenized_query = query.split()
|
516 |
-
bm25_scores = bm25.get_scores(tokenized_query)
|
517 |
-
|
518 |
-
# Convert BM25 scores to list of (chunk_id, score)
|
519 |
-
bm25_list = [
|
520 |
-
(chunk_ids[i], float(score)) for i, score in enumerate(bm25_scores)
|
521 |
-
]
|
522 |
-
|
523 |
-
# Sort bm25_list by score in descending order and limit to top N results
|
524 |
-
bm25_list = sorted(bm25_list, key=lambda x: x[1], reverse=True)[
|
525 |
-
: self.config.num_chunks
|
526 |
-
]
|
527 |
-
|
528 |
-
# Normalize BM25 scores
|
529 |
-
max_bm25 = max([score for _, score in bm25_list]) if bm25_list else 1
|
530 |
-
bm25_list = [(doc_id, score / max_bm25) for doc_id, score in bm25_list]
|
531 |
-
|
532 |
-
# Pass the lists to rank fusion
|
533 |
-
result_lists = [embedding_list, bm25_list]
|
534 |
-
weights = [self.config.embedding_weight, self.config.bm25_weight]
|
535 |
-
|
536 |
-
combined_results = reciprocal_rank_fusion(result_lists, weights=weights)
|
537 |
-
|
538 |
-
return combined_results
|
539 |
-
|
540 |
-
except Exception as e:
|
541 |
-
self.logger.error(f"Error in rank fusion retrieval: {str(e)}")
|
542 |
-
raise
|
543 |
-
|
544 |
-
def generate_enhanced_summary(
|
545 |
-
self,
|
546 |
-
vector_store: Chroma,
|
547 |
-
bm25: BM25Okapi,
|
548 |
-
chunk_ids: List[str],
|
549 |
-
query: str = "Summarize the main points of this document",
|
550 |
-
) -> List[Dict]:
|
551 |
-
"""Generate enhanced summary using both vector and BM25 retrieval"""
|
552 |
-
try:
|
553 |
-
# Get combined results using rank fusion
|
554 |
-
ranked_results = self.retrieve_with_rank_fusion(
|
555 |
-
vector_store, bm25, chunk_ids, query
|
556 |
-
)
|
557 |
-
|
558 |
-
# Prepare context and track sources
|
559 |
-
contexts = []
|
560 |
-
sources = []
|
561 |
-
|
562 |
-
# Get full documents for top results
|
563 |
-
for chunk_id, score in ranked_results[: self.config.num_chunks]:
|
564 |
-
results = vector_store.get(
|
565 |
-
where={"chunk_id": chunk_id}, include=["documents", "metadatas"]
|
566 |
-
)
|
567 |
-
|
568 |
-
if results["documents"]:
|
569 |
-
context = results["documents"][0]
|
570 |
-
metadata = results["metadatas"][0]
|
571 |
-
|
572 |
-
contexts.append(context)
|
573 |
-
sources.append(
|
574 |
-
{
|
575 |
-
"content": context,
|
576 |
-
"page": metadata["page"],
|
577 |
-
"chunk_id": chunk_id,
|
578 |
-
"relevance_score": score,
|
579 |
-
"context": metadata.get("context", ""),
|
580 |
-
}
|
581 |
-
)
|
582 |
-
|
583 |
-
url_request = f"{api_url}/modelo/{self.id_modelo_do_usuario}"
|
584 |
-
resposta = requests.get(url_request)
|
585 |
-
|
586 |
-
if resposta.status_code != 200:
|
587 |
-
return Response(
|
588 |
-
{
|
589 |
-
"error": "Ocorreu um problema. Pode ser que o modelo não tenha sido encontrado. Tente novamente e/ou entre em contato com a equipe técnica"
|
590 |
-
}
|
591 |
-
)
|
592 |
-
|
593 |
-
modelo_buscado = resposta.json()["modelo"]
|
594 |
-
|
595 |
-
llm = ChatOpenAI(
|
596 |
-
temperature=self.gpt_temperature,
|
597 |
-
model_name=self.gpt_model,
|
598 |
-
api_key=self.openai_api_key,
|
599 |
-
)
|
600 |
-
|
601 |
-
prompt_gerar_relatorio = PromptTemplate(
|
602 |
-
template=self.prompt_relatorio, input_variables=["context"]
|
603 |
-
)
|
604 |
-
|
605 |
-
relatorio_gerado = llm.predict(
|
606 |
-
prompt_gerar_relatorio.format(context="\n\n".join(contexts))
|
607 |
-
)
|
608 |
-
|
609 |
-
prompt_gerar_modelo = PromptTemplate(
|
610 |
-
template=self.prompt_modelo,
|
611 |
-
input_variables=["context", "modelo_usuario"],
|
612 |
-
)
|
613 |
-
|
614 |
-
modelo_gerado = llm.predict(
|
615 |
-
prompt_gerar_modelo.format(
|
616 |
-
context=relatorio_gerado, modelo_usuario=modelo_buscado
|
617 |
-
)
|
618 |
-
)
|
619 |
-
|
620 |
-
# Split the response into paragraphs
|
621 |
-
summaries = [p.strip() for p in modelo_gerado.split("\n\n") if p.strip()]
|
622 |
-
|
623 |
-
# Create structured output
|
624 |
-
structured_output = []
|
625 |
-
for idx, summary in enumerate(summaries):
|
626 |
-
source_idx = min(idx, len(sources) - 1)
|
627 |
-
structured_output.append(
|
628 |
-
{
|
629 |
-
"content": summary,
|
630 |
-
"source": {
|
631 |
-
"page": sources[source_idx]["page"],
|
632 |
-
"text": sources[source_idx]["content"][:200] + "...",
|
633 |
-
"context": sources[source_idx]["context"],
|
634 |
-
"relevance_score": sources[source_idx]["relevance_score"],
|
635 |
-
"chunk_id": sources[source_idx]["chunk_id"],
|
636 |
-
},
|
637 |
-
}
|
638 |
-
)
|
639 |
-
|
640 |
-
return structured_output
|
641 |
-
|
642 |
-
except Exception as e:
|
643 |
-
self.logger.error(f"Error generating enhanced summary: {str(e)}")
|
644 |
-
raise
|
645 |
-
|
646 |
-
|
647 |
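For reference, the removed retrieve_with_rank_fusion above boils down to building one (id, score) list per retriever and handing both to reciprocal_rank_fusion. A minimal, self-contained sketch of that preparation step, assuming the same rank_bm25 dependency; dense_distances here is a stand-in for what Chroma's similarity_search_with_score would return:

```python
from rank_bm25 import BM25Okapi

def hybrid_rankings(query, texts, dense_distances, num_chunks=5,
                    embedding_weight=0.5, bm25_weight=0.5):
    """Toy version of the removed retrieve_with_rank_fusion: one (index, score) list per retriever.

    dense_distances[i] is the vector-store distance of texts[i] to the query
    (smaller means closer, as Chroma reports); BM25 is computed here directly.
    """
    # Dense side: turn distances into similarities in (0, 1] and keep the top N.
    dense = sorted(
        ((i, 1.0 / (1.0 + d)) for i, d in enumerate(dense_distances)),
        key=lambda x: x[1], reverse=True,
    )[:num_chunks]

    # Lexical side: BM25 over whitespace-tokenized chunks, normalized by the max score.
    bm25 = BM25Okapi([t.split() for t in texts])
    scores = bm25.get_scores(query.split())
    lexical = sorted(enumerate(map(float, scores)), key=lambda x: x[1], reverse=True)[:num_chunks]
    max_score = max((s for _, s in lexical), default=1.0) or 1.0
    lexical = [(i, s / max_score) for i, s in lexical]

    # These two lists and their weights are what the real code hands to reciprocal_rank_fusion.
    return [dense, lexical], [embedding_weight, bm25_weight]
```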
async def get_llm_summary_answer_by_cursor_complete(
    serializer, listaPDFs=None, contexto=None
):

@@ -675,6 +65,7 @@ async def get_llm_summary_answer_by_cursor_complete(
         gpt_temperature=serializer["gpt_temperature"],
         id_modelo_do_usuario=serializer["id_modelo_do_usuario"],
         prompt_modelo=serializer["prompt_modelo"],
     )

     full_text = ""

@@ -699,18 +90,61 @@ async def get_llm_summary_answer_by_cursor_complete(
     full_text = " ".join([page.page_content for page in pages])

     # Contextualize chunks
-    (old lines 702-704 removed; their content is collapsed in this view)

     # Create enhanced vector store and BM25 index
     vector_store, bm25, chunk_ids = summarizer.create_enhanced_vector_store(
-        (old line 708 removed; content collapsed in this view)
     )

     # Generate enhanced summary
     structured_summaries = summarizer.generate_enhanced_summary(
-        vector_store,
-        (remaining removed arguments collapsed in this view)
     )

     # Output results as JSON

@@ -719,7 +153,7 @@ async def get_llm_summary_answer_by_cursor_complete(
     print(json_output)
     texto_completo = ""
     for x in structured_summaries:
-        texto_completo = texto_completo + x["content"]
     return {
         "resultado": structured_summaries,
         "texto_completo": texto_completo,

@@ -745,169 +179,3 @@ async def get_llm_summary_answer_by_cursor_complete(
         "prompt_modelo": serializer["prompt_modelo"],
     },
 }
Removed from _utils/resumo_completo_cursor.py (old lines 748-913; the ragas experiment was moved to _utils/ragas.py by this commit):

from ragas import evaluate

from langchain.chains import SequentialChain
from langchain.prompts import PromptTemplate

# from langchain.schema import ChainResult
from langchain.memory import SimpleMemory


def test_ragas(serializer, listaPDFs):

    # Step 2: Setup RetrievalConfig and EnhancedDocumentSummarizer
    config = RetrievalConfig(
        num_chunks=serializer["num_chunks_retrieval"],
        embedding_weight=serializer["embedding_weight"],
        bm25_weight=serializer["bm25_weight"],
        context_window=serializer["context_window"],
        chunk_overlap=serializer["chunk_overlap"],
    )

    summarizer = EnhancedDocumentSummarizer(
        openai_api_key=os.environ.get("OPENAI_API_KEY"),
        claude_api_key=os.environ.get("CLAUDE_API_KEY"),
        config=config,
        embedding_model=serializer["hf_embedding"],
        chunk_overlap=serializer["chunk_overlap"],
        chunk_size=serializer["chunk_size"],
        num_k_rerank=serializer["num_k_rerank"],
        model_cohere_rerank=serializer["model_cohere_rerank"],
        claude_context_model=serializer["claude_context_model"],
        prompt_relatorio=serializer["prompt_relatorio"],
        gpt_model=serializer["model"],
        gpt_temperature=serializer["gpt_temperature"],
        id_modelo_do_usuario=serializer["id_modelo_do_usuario"],
        prompt_modelo=serializer["prompt_modelo"],
    )

    # Step 1: Define the components
    def load_and_split_documents(pdf_list, summarizer):
        """Loads and splits PDF documents into chunks."""
        all_chunks = []
        for pdf_path in pdf_list:
            chunks = summarizer.load_and_split_document(pdf_path)
            all_chunks.extend(chunks)
        return {"chunks": all_chunks}

    def get_full_text_from_pdfs(pdf_list):
        """Gets the full text from PDFs for contextualization."""
        full_text = []
        for pdf_path in pdf_list:
            loader = PyPDFLoader(pdf_path)
            pages = loader.load()
            text = " ".join([page.page_content for page in pages])
            full_text.append(text)
        return {"full_text": " ".join(full_text)}

    def contextualize_chunks(full_text, chunks, contextual_retriever):
        """Adds context to chunks using Claude."""
        contextualized_chunks = contextual_retriever.contextualize_chunks(full_text, chunks)
        return {"contextualized_chunks": contextualized_chunks}

    def create_vector_store(contextualized_chunks, summarizer):
        """Creates an enhanced vector store and BM25 index."""
        vector_store, bm25, chunk_ids = summarizer.create_enhanced_vector_store(contextualized_chunks)
        return {"vector_store": vector_store, "bm25": bm25, "chunk_ids": chunk_ids}

    def generate_summary(vector_store, bm25, chunk_ids, query, summarizer):
        """Generates an enhanced summary using the vector store and BM25 index."""
        structured_summaries = summarizer.generate_enhanced_summary(vector_store, bm25, chunk_ids, query)
        return {"structured_summaries": structured_summaries}

    # Step 3: Define Sequential Chain
    chain = SequentialChain(
        chains=[
            lambda inputs: load_and_split_documents(inputs["pdf_list"], summarizer),
            lambda inputs: get_full_text_from_pdfs(inputs["pdf_list"]),
            lambda inputs: contextualize_chunks(
                inputs["full_text"], inputs["chunks"], summarizer.contextual_retriever
            ),
            lambda inputs: create_vector_store(
                inputs["contextualized_chunks"], summarizer
            ),
            lambda inputs: generate_summary(
                inputs["vector_store"],
                inputs["bm25"],
                inputs["chunk_ids"],
                inputs["user_message"],
                summarizer,
            ),
        ],
        input_variables=["pdf_list", "user_message"],
        output_variables=["structured_summaries"],
    )

    from ragas.langchain.evalchain import RagasEvaluatorChain
    from ragas.metrics import (
        LLMContextRecall,
        Faithfulness,
        FactualCorrectness,
        SemanticSimilarity,
    )
    from ragas import evaluate
    from ragas.llms import LangchainLLMWrapper

    # from ragas.embeddings import LangchainEmbeddingsWrapper
    # evaluator_llm = LangchainLLMWrapper(ChatOpenAI(model="gpt-4o-mini"))
    evaluator_llm = LangchainLLMWrapper(chain)
    # evaluator_embeddings = LangchainEmbeddingsWrapper(OpenAIEmbeddings())
    from datasets import load_dataset

    dataset = load_dataset(
        "explodinggradients/amnesty_qa", "english_v3", trust_remote_code=True
    )

    from ragas import EvaluationDataset

    eval_dataset = EvaluationDataset.from_hf_dataset(dataset["eval"])

    metrics = [
        LLMContextRecall(llm=evaluator_llm),
        FactualCorrectness(llm=evaluator_llm),
        Faithfulness(llm=evaluator_llm),
        # SemanticSimilarity(embeddings=evaluator_embeddings)
    ]
    results = evaluate(dataset=eval_dataset, metrics=metrics)
    print("results: ", results)

    # Step 4: Run the Chain
    inputs = {
        "pdf_list": listaPDFs,
        "user_message": serializer["user_message"],
    }
    # result = chain.run(inputs)
    return Response({"msg": results})

    # Step 5: Format the Output
    # return {
    #     "resultado": result["structured_summaries"],
    #     "parametros-utilizados": {
    #         "num_chunks_retrieval": ..., "embedding_weight": ..., "bm25_weight": ...,
    #         "context_window": ..., "chunk_overlap": ..., "num_k_rerank": ...,
    #         "model_cohere_rerank": ..., "more_initial_chunks_for_reranking": ...,
    #         "claude_context_model": ..., "gpt_temperature": ..., "user_message": ...,
    #         "model": ..., "hf_embedding": ..., "chunk_size": ..., "chunk_overlap": ...,
    #         "prompt_relatorio": ..., "prompt_modelo": ...,
    #     },
    # }
_utils/resumo_completo_cursor.py after the commit (top of the new file; unchanged regions are collapsed by the diff viewer):

 import os
 from langchain_community.document_loaders import PyPDFLoader
 import json
+from _utils.gerar_relatorio_modelo_usuario.EnhancedDocumentSummarizer import (
+    EnhancedDocumentSummarizer,
+)
+from _utils.models.gerar_relatorio import (
+    RetrievalConfig,
+)


 def reciprocal_rank_fusion(result_lists, weights=None):
     """Combine multiple ranked lists using reciprocal rank fusion"""
     (body unchanged, collapsed in this view)

 os.environ["LANGCHAIN_PROJECT"] = "VELLA"
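The body of reciprocal_rank_fusion is collapsed in this diff. A minimal sketch of what a weighted reciprocal rank fusion over (doc_id, score) lists typically looks like; the constant k=60 and the exact weighting scheme are assumptions, not necessarily what this project implements:

```python
def reciprocal_rank_fusion_sketch(result_lists, weights=None, k=60):
    """Fuse several ranked lists of (doc_id, score) pairs.

    Each input list is sorted by its own score; fusion only uses the rank,
    so the score scales of the individual retrievers do not matter.
    """
    if weights is None:
        weights = [1.0] * len(result_lists)

    fused = {}
    for results, weight in zip(result_lists, weights):
        ranked = sorted(results, key=lambda x: x[1], reverse=True)
        for rank, (doc_id, _) in enumerate(ranked):
            fused[doc_id] = fused.get(doc_id, 0.0) + weight / (k + rank + 1)

    # Highest fused score first, mirroring the (chunk_id, score) shape used elsewhere.
    return sorted(fused.items(), key=lambda x: x[1], reverse=True)
```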
New lines 37-108 of the same function (unchanged regions collapsed):

 async def get_llm_summary_answer_by_cursor_complete(
     serializer, listaPDFs=None, contexto=None
 ):
     (unchanged lines collapsed)
         gpt_temperature=serializer["gpt_temperature"],
         id_modelo_do_usuario=serializer["id_modelo_do_usuario"],
         prompt_modelo=serializer["prompt_modelo"],
+        reciprocal_rank_fusion=reciprocal_rank_fusion,
     )

     full_text = ""
     (unchanged lines collapsed)
     full_text = " ".join([page.page_content for page in pages])

     # Contextualize chunks
+    if serializer["should_have_contextual_chunks"]:
+        contextualized_chunks = (
+            await summarizer.contextual_retriever.contextualize_all_chunks(
+                pages, allPdfsChunks
+            )
+        )
+        chunks_passados = contextualized_chunks
+        is_contextualized_chunk = True
+    else:
+        chunks_passados = allPdfsChunks
+        is_contextualized_chunk = False

     # Create enhanced vector store and BM25 index
     vector_store, bm25, chunk_ids = summarizer.create_enhanced_vector_store(
+        chunks_passados, is_contextualized_chunk
     )
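The should_have_contextual_chunks flag above decides whether the texts that reach the vector store and BM25 index carry a Claude-generated context prefix or just the raw chunk content. A rough sketch of that difference; the field names follow the dataclasses used in this repo, but the way create_enhanced_vector_store consumes the is_contextualized_chunk flag is an assumption:

```python
def texts_for_indexing(chunks, is_contextualized_chunk):
    # Contextualized chunks expose an extra `context` attribute produced by the
    # Claude call; plain chunks only have `content`.
    if is_contextualized_chunk:
        return [f"{chunk.context} {chunk.content}" for chunk in chunks]
    return [chunk.content for chunk in chunks]
```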
+    prompt_relatorio_sem_context = """ You are a language model specialized in producing concise and well-structured legal case summaries in Portuguese. You will receive a variable `context`, which contains information about a legal case. Your task is to read the `context` carefully and produce a summary report in Portuguese, following the specific format provided below. Do not include any additional comments or reasoning steps in your final answer.
+    **Instructions**:
+    1. **Chain of Thought**: Before producing your final answer, you must think through and plan your summary silently, without showing this reasoning in the final output. The final answer must only contain the required formatted report and nothing else.
+    2. **Reading the Context**: Extract the following information from `context`:
+    - The name of the defendant (réu).
+    - The crime they have been accused of (nome_do_crime).
+    - The applicable article and subsection of the Penal Code (artigo_e_inciso_do_crime).
+    - The date the accusation was accepted (data_do_recebimento).
+    - The ID of the decision document (id_do_documento).
+    3. **Prescriptive Details**: If no other interruptive or suspensive causes of prescription are mentioned, confirm that there are none.
+    4. **Formatting**: Your final answer must strictly follow the format below, in Portuguese, and replace the placeholders with the appropriate information:
+    ```
+    <formato>
+    Trata-se de Ação Penal em que o Ministério Público denunciou [nome_do_reu], pela prática do [nome_do_crime] [artigo_e_inciso_do_crime], do Código Penal.
+    A denúncia foi recebida em [data_do_recebimento], conforme Decisão [id_do_documento].
+    Não há outras causas interruptivas ou suspensivas da prescrição.
+    </formato>
+    ```
+    5. **Completeness**: If any piece of required information is missing in the `context`, note that explicitly in the final answer within the format.
+    **Reminder**:
+    - Do not include your chain of thought in the final output.
+    - Do not add extra information or commentary beyond the specified format.
+    - The final answer must be in Portuguese.
+    ```
+    <formato>
+    Trata-se de Ação Penal em que o Ministério Público denunciou João da Silva, pela prática do furto qualificado (art. 155, §4º, inciso II do Código Penal).
+    A denúncia foi recebida em 12/03/2021, conforme Decisão 20210312-01.
+    </formato>
+    """

     # Generate enhanced summary
     structured_summaries = summarizer.generate_enhanced_summary(
+        vector_store,
+        bm25,
+        chunk_ids
+        # , serializer["user_message"]
+        ,
+        prompt_relatorio_sem_context,
     )

     # Output results as JSON
     (unchanged lines collapsed)
     print(json_output)
     texto_completo = ""
     for x in structured_summaries:
+        texto_completo = texto_completo + x["content"] + "\n"
     return {
         "resultado": structured_summaries,
         "texto_completo": texto_completo,
         (unchanged lines collapsed)
         "prompt_modelo": serializer["prompt_modelo"],
     },
 }
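The report prompt is rendered through LangChain's PromptTemplate before the OpenAI call, as generate_enhanced_summary does with self.prompt_relatorio. A minimal, self-contained sketch of that rendering step, using a stand-in template rather than the project's real prompt:

```python
from langchain.prompts import PromptTemplate

# Stand-in template; the real prompt_relatorio is far longer and targets Portuguese output.
template = "Summarize the following legal case context:\n\n{context}\n\nSummary:"
prompt = PromptTemplate(template=template, input_variables=["context"])

retrieved_chunks = ["chunk one ...", "chunk two ..."]  # hypothetical retrieval output
rendered = prompt.format(context="\n\n".join(retrieved_chunks))
# `rendered` is the string that would be handed to llm.predict(...) in generate_enhanced_summary.
print(rendered)
```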
gerar_relatorio_modelo_usuario/__init__.py  ADDED (file without changes)
gerar_relatorio_modelo_usuario/admin.py  ADDED
@@ -0,0 +1,3 @@
+from django.contrib import admin
+
+# Register your models here.
gerar_relatorio_modelo_usuario/apps.py  ADDED
@@ -0,0 +1,6 @@
+from django.apps import AppConfig
+
+
+class GerarRelatorioModeloUsuarioConfig(AppConfig):
+    default_auto_field = 'django.db.models.BigAutoField'
+    name = 'gerar_relatorio_modelo_usuario'
gerar_relatorio_modelo_usuario/migrations/__init__.py  ADDED (file without changes)
gerar_relatorio_modelo_usuario/models.py  ADDED
@@ -0,0 +1,3 @@
+from django.db import models
+
+# Create your models here.
gerar_relatorio_modelo_usuario/serializer.py  ADDED
@@ -0,0 +1,33 @@
+from rest_framework import serializers
+from resumos.serializer import ResumoCursorSerializer
+from _utils.gerar_relatorio_modelo_usuario.prompts import (
+    system_prompt_modelo,
+    system_prompt_relatorio,
+)
+
+user_message = "What are the main points of this document?"
+
+
+class ResumoCursorCompeltoSerializer(ResumoCursorSerializer):
+    system_prompt = None
+    prompt_relatorio = serializers.CharField(
+        required=False, default=system_prompt_relatorio
+    )
+    prompt_modelo = serializers.CharField(required=False, default=system_prompt_modelo)
+    user_message = serializers.CharField(required=False, default=user_message)
+    num_chunks_retrieval = serializers.IntegerField(default=5)
+    embedding_weight = serializers.FloatField(default=0.5)
+    bm25_weight = serializers.FloatField(default=0.5)
+    context_window = serializers.IntegerField(default=3)
+    chunk_overlap = serializers.IntegerField(default=200)
+    num_k_rerank = serializers.IntegerField(default=5)
+    model_cohere_rerank = serializers.CharField(
+        required=False, default="rerank-english-v2.0"
+    )
+    more_initial_chunks_for_reranking = serializers.IntegerField(default=20)
+    claude_context_model = serializers.CharField(
+        required=False, default="claude-3-haiku-20240307"
+    )
+    gpt_temperature = serializers.FloatField(default=0)
+    id_modelo_do_usuario = serializers.IntegerField(required=True)
+    should_have_contextual_chunks = serializers.BooleanField(default=False)
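The serializer above leans on DRF's default= handling: any field the client omits still shows up in validated_data. A tiny self-contained illustration of that mechanism (not the project's serializer, just the same pattern; assumes it runs inside a configured Django/DRF environment such as this project's manage.py shell):

```python
from rest_framework import serializers

class TuningSerializer(serializers.Serializer):
    # Mirrors the style used above: optional knobs with defaults, one required id.
    num_chunks_retrieval = serializers.IntegerField(default=5)
    gpt_temperature = serializers.FloatField(default=0)
    id_modelo_do_usuario = serializers.IntegerField(required=True)

s = TuningSerializer(data={"id_modelo_do_usuario": 9})
s.is_valid(raise_exception=True)
# validated_data now includes num_chunks_retrieval and gpt_temperature
# even though the client sent neither.
print(s.validated_data)
```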
gerar_relatorio_modelo_usuario/tests.py  ADDED
@@ -0,0 +1,3 @@
+from django.test import TestCase
+
+# Create your tests here.
gerar_relatorio_modelo_usuario/views.py  ADDED
@@ -0,0 +1,60 @@
+from rest_framework.views import APIView
+from adrf.views import APIView as AsyncAPIView
+import tempfile, os
+from rest_framework.response import Response
+
+from _utils.resumo_completo_cursor import (
+    get_llm_summary_answer_by_cursor_complete,
+)
+from .serializer import (
+    ResumoCursorCompeltoSerializer,
+)
+from rest_framework.parsers import MultiPartParser
+from drf_spectacular.utils import extend_schema
+
+
+class ResumoSimplesCursorCompletoView(AsyncAPIView):
+    parser_classes = [MultiPartParser]
+
+    @extend_schema(
+        request=ResumoCursorCompeltoSerializer,
+    )
+    async def post(self, request):
+        serializer = ResumoCursorCompeltoSerializer(data=request.data)
+        if serializer.is_valid(raise_exception=True):
+            print("\n\n\n")
+            print("serializer.validated_data: ", serializer.validated_data)
+            print("\n\n\n")
+            listaPDFs = []
+            data = serializer.validated_data
+            print("\nserializer.validated_data: ", serializer.validated_data)
+
+            for file in serializer.validated_data["files"]:
+                file.seek(0)
+                with tempfile.NamedTemporaryFile(
+                    delete=False, suffix=".pdf"
+                ) as temp_file:  # Create a temporary file to save the uploaded PDF
+                    for chunk in file.chunks():  # Write the uploaded file content to the temporary file
+                        temp_file.write(chunk)
+                    temp_file_path = temp_file.name  # Get the path of the temporary file
+                listaPDFs.append(temp_file_path)
+            print("listaPDFs: ", listaPDFs)
+
+            resposta_llm = await get_llm_summary_answer_by_cursor_complete(
+                data, listaPDFs
+            )
+
+            final = resposta_llm
+            print("\n\n\n")
+            print("final: ", final)
+
+            for file in listaPDFs:
+                os.remove(file)
+
+            return Response({"resposta": final})
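From a client's point of view, the new view is a multipart POST carrying one or more PDFs plus the serializer fields. A hedged example with requests; the host and route follow the "gerar-relatorio" path added in setup/urls.py further below, and the file name and field values are sample data:

```python
import requests

# Hypothetical local dev server; adjust host/port to your deployment.
url = "http://localhost:8000/gerar-relatorio"

with open("processo.pdf", "rb") as pdf:
    response = requests.post(
        url,
        files=[("files", ("processo.pdf", pdf, "application/pdf"))],
        data={
            "id_modelo_do_usuario": 9,                 # required field
            "should_have_contextual_chunks": "false",  # skip the Claude contextualization pass
        },
    )

print(response.status_code)
print(response.json()["resposta"])
```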
ragas_api/serializer.py  CHANGED
@@ -1,5 +1,5 @@
 from rest_framework import serializers
-from (rest of the old import line truncated in this view)
+from gerar_relatorio_modelo_usuario.serializer import ResumoCursorCompeltoSerializer


 class RagasSerializer(ResumoCursorCompeltoSerializer):
ragas_api/views.py  CHANGED
@@ -2,9 +2,9 @@ from rest_framework.views import APIView
 import tempfile, os
 from rest_framework.response import Response

+from _utils.ragas import test_ragas
 from _utils.resumo_completo_cursor import (
     get_llm_summary_answer_by_cursor_complete,
-    test_ragas,
 )
 from .serializer import (
     RagasFromTextSerializer,
resumos/serializer.py  CHANGED
@@ -27,127 +27,3 @@ class ResumoCursorSerializer(serializers.Serializer):
     hf_embedding = serializers.CharField(required=False, default="all-MiniLM-L6-v2")
     chunk_size = serializers.IntegerField(required=False, default=1000)
     chunk_overlap = serializers.IntegerField(required=False, default=200)

Removed (old lines 30-153):

# system_prompt_relatorio = """
# Based on the following context, provide multiple key points from the document.
# For each point, create a new paragraph.
# Each paragraph should be a complete, self-contained insight.
# Include any relevant context provided.

# Context: {context}

# Key points:
# """
system_prompt_relatorio = """
You are a language model specialized in producing concise and well-structured legal case summaries in Portuguese. You will receive a variable `context`, which contains information about a legal case. Your task is to read the `context` carefully and produce a summary report in Portuguese, following the specific format provided below. Do not include any additional comments or reasoning steps in your final answer.
**Instructions**:
1. **Chain of Thought**: Before producing your final answer, you must think through and plan your summary silently, without showing this reasoning in the final output. The final answer must only contain the required formatted report and nothing else.
2. **Reading the Context**: Extract the following information from `context`:
- The name of the defendant (réu).
- The crime they have been accused of (nome_do_crime).
- The applicable article and subsection of the Penal Code (artigo_e_inciso_do_crime).
- The date the accusation was accepted (data_do_recebimento).
- The ID of the decision document (id_do_documento).
3. **Prescriptive Details**: If no other interruptive or suspensive causes of prescription are mentioned, confirm that there are none.
4. **Formatting**: Your final answer must strictly follow the format below, in Portuguese, and replace the placeholders with the appropriate information:
```
<formato>
Trata-se de Ação Penal em que o Ministério Público denunciou [nome_do_reu], pela prática do [nome_do_crime] [artigo_e_inciso_do_crime], do Código Penal.
A denúncia foi recebida em [data_do_recebimento], conforme Decisão [id_do_documento].
Não há outras causas interruptivas ou suspensivas da prescrição.
</formato>
```
5. **Completeness**: If any piece of required information is missing in the `context`, note that explicitly in the final answer within the format.
**Reminder**:
- Do not include your chain of thought in the final output.
- Do not add extra information or commentary beyond the specified format.
- The final answer must be in Portuguese.
---

**Contextual Information (provided separately):**
{context}
---
**Example with a given context**:
- Input:
`context` = "Em 10/03/2021, o Ministério Público denunciou João da Silva, imputando-lhe o crime de furto qualificado, previsto no art. 155, §4º, inciso II, do Código Penal. A denúncia foi recebida em 12/03/2021, conforme Decisão nº 20210312-01. Não há menção a qualquer causa interruptiva ou suspensiva da prescrição."
- Expected final answer:
```
<formato>
Trata-se de Ação Penal em que o Ministério Público denunciou João da Silva, pela prática do furto qualificado (art. 155, §4º, inciso II do Código Penal).
A denúncia foi recebida em 12/03/2021, conforme Decisão 20210312-01.
Não há outras causas interruptivas ou suspensivas da prescrição.
</formato>
"""

user_message = "What are the main points of this document?"

# system_prompt_modelo = """
# Based on the following context, provide multiple key points from the document.
# For each point, create a new paragraph.
# Each paragraph should be a complete, self-contained insight.
# Include any relevant context provided.

# Context: {context}

# Modelo do usuário: {modelo_usuario}

# Key points:
# """
system_prompt_modelo = """
You are a large language model that must produce a single final sentence in **Portuguese**. To do this, you will follow a private chain of thought and then produce a final answer. The final answer must follow the formatting and stylistic conventions shown in the user-provided model `user's template`. The information to be included in the final sentence is derived from the `context` (a report describing a legal case).
**Contextual Information (provided separately):**
{context}
**User Model (provided separately):**
{modelo_do_usuario}
**Instructions:**
1. **Goal:** Produce one single final sentence in Portuguese that matches the structure, format, and style given by `user's template`.
2. **Chain of Thought (private to the assistant and not to be shown in the final answer):**
- Carefully review the `context` which is a legal report of a case.
- Identify:
- The defendant's name.
- The crime's name, its article, and any subsection (inciso).
- The date of receipt of the complaint (data do recebimento da denúncia).
- The document ID.
- Ensure these elements are correctly incorporated into the final sentence.
- Check compliance with the formatting style indicated by `user's template`.
- Compose the sentence following the structure from the user model.
- Use reflection: Before finalizing the answer, reassess if all required information is included, if the format matches the user model, and if the sentence is written correctly in Portuguese.
3. **Reflection Technique (private):**
After composing the sentence, but before presenting it as the final answer, reflect if:
- All required details from the `context` are accurately included.
- The sentence format strictly matches the pattern of `user's template`.
- The sentence is grammatically correct in Portuguese.
4. **Final Answer:**
- After completing the chain of thought and ensuring correctness through reflection, present only the final sentence in Portuguese.
- Do not show the chain of thought or the reflection step. Only the final formatted sentence should be visible to the user.
"""

class ResumoCursorCompeltoSerializer(ResumoCursorSerializer):
    system_prompt = None
    prompt_relatorio = serializers.CharField(required=False, default=system_prompt_relatorio)
    prompt_modelo = serializers.CharField(required=False, default=system_prompt_modelo)
    user_message = serializers.CharField(required=False, default=user_message)
    num_chunks_retrieval = serializers.IntegerField(default=5)
    embedding_weight = serializers.FloatField(default=0.5)
    bm25_weight = serializers.FloatField(default=0.5)
    context_window = serializers.IntegerField(default=3)
    chunk_overlap = serializers.IntegerField(default=200)
    num_k_rerank = serializers.IntegerField(default=5)
    model_cohere_rerank = serializers.CharField(required=False, default="rerank-english-v2.0")
    more_initial_chunks_for_reranking = serializers.IntegerField(default=20)
    claude_context_model = serializers.CharField(required=False, default="claude-3-haiku-20240307")
    gpt_temperature = serializers.FloatField(default=0)
    id_modelo_do_usuario = serializers.IntegerField(required=True)


class RagasSerializer(ResumoCursorCompeltoSerializer):
    files = serializers.ListField(child=serializers.FileField(), required=True)
    id_modelo_do_usuario = serializers.IntegerField(required=False)
    hf_embedding = serializers.CharField(required=False, default="all-MiniLM-L6-v2")


class RagasFromTextSerializer(ResumoCursorCompeltoSerializer):
    files = None
    id_modelo_do_usuario = serializers.IntegerField(required=False, default=9)
    user_message = serializers.CharField(required=True)
    context_provided = serializers.CharField(required=False)
resumos/views.py  CHANGED
@@ -1,20 +1,11 @@
 from rest_framework.views import APIView
-from adrf.views import APIView as AsyncAPIView
 import tempfile, os
 from rest_framework.response import Response
-
-from _utils.resumo_completo_cursor import (
-    get_llm_summary_answer_by_cursor_complete,
-    test_ragas,
-)
 from _utils.resumo_simples_cursor import get_llm_summary_answer_by_cursor
 from _utils.utils import DEFAULT_SYSTEM_PROMPT
 from .serializer import (
-    RagasFromTextSerializer,
-    ResumoCursorCompeltoSerializer,
     ResumoPDFSerializer,
     ResumoCursorSerializer,
-    RagasSerializer,
 )
 from _utils.main import get_llm_answer_summary, get_llm_answer_summary_with_embedding
 from setup.environment import default_model

@@ -151,164 +142,3 @@ class ResumoSimplesCursorView(APIView):
             os.remove(file)

         return Response({"resposta": resposta_llm})

Removed (old lines 154-314):

class ResumoSimplesCursorCompletoView(AsyncAPIView):
    parser_classes = [MultiPartParser]

    @extend_schema(
        request=ResumoCursorCompeltoSerializer,
    )
    async def post(self, request):
        serializer = ResumoCursorCompeltoSerializer(data=request.data)
        if serializer.is_valid(raise_exception=True):
            print("\n\n\n")
            print("serializer.validated_data: ", serializer.validated_data)
            print("\n\n\n")
            listaPDFs = []
            data = serializer.validated_data
            print("\nserializer.validated_data: ", serializer.validated_data)

            for file in serializer.validated_data["files"]:
                file.seek(0)
                with tempfile.NamedTemporaryFile(delete=False, suffix=".pdf") as temp_file:  # Create a temporary file to save the uploaded PDF
                    for chunk in file.chunks():  # Write the uploaded file content to the temporary file
                        temp_file.write(chunk)
                    temp_file_path = temp_file.name  # Get the path of the temporary file
                listaPDFs.append(temp_file_path)
            print("listaPDFs: ", listaPDFs)

            # resposta_llm = await get_llm_summary_answer_by_cursor_complete(
            #     data, listaPDFs
            # )

            resposta_llm = await get_llm_summary_answer_by_cursor_complete(
                data, listaPDFs
            )

            final = resposta_llm
            print("\n\n\n")
            print("final: ", final)

            for file in listaPDFs:
                os.remove(file)

            return Response({"resposta": final})


class RagasView(APIView):
    parser_classes = [MultiPartParser]

    @extend_schema(
        request=RagasSerializer,
    )
    def post(self, request):
        serializer = RagasSerializer(data=request.data)
        print("\n\n\n")
        print("\n\n\n")
        print("serializer.data: ", serializer)
        listaPDFs = []
        if serializer.is_valid(raise_exception=True):
            for file in serializer.validated_data["files"]:
                file.seek(0)
                with tempfile.NamedTemporaryFile(delete=False, suffix=".pdf") as temp_file:  # Create a temporary file to save the uploaded PDF
                    for chunk in file.chunks():  # Write the uploaded file content to the temporary file
                        temp_file.write(chunk)
                    temp_file_path = temp_file.name  # Get the path of the temporary file
                listaPDFs.append(temp_file_path)

            result = test_ragas(serializer, listaPDFs)

            for file in listaPDFs:
                os.remove(file)

            return Response({"msg": result})


class RagasFromTextView(APIView):
    def post(self, request):
        serializer = RagasFromTextSerializer(data=request.data)
        if serializer.is_valid(raise_exception=True):
            from datasets import Dataset
            from ragas import evaluate
            from ragas.metrics import (
                faithfulness,
                answer_relevancy,
                answer_correctness,
                context_precision,
                context_recall,
            )
            import os
            from datasets import load_dataset
            import pandas as pd

            os.environ.get("OPENAI_API_KEY")

            df_pandas = pd.read_csv(
                "D:/repositorios/projetos-pessoais/projeto-y-backend-hugginf-face-teste-01/vella-backend/_utils/files/ragas_testset.csv"
            )
            # print(df_pandas["position"])  # Print a specific column
            data = {
                "user_input": [
                    "What is the capital of France?",
                ],
                "response": [],
                "retrieved_contexts": [],
            }

            reference = [
                "Paris is the capital of France. It is a major European city known for its culture."
            ]

            for x in df_pandas["user_input"]:
                data["user_input"].append(x)

            for x in df_pandas["reference"]:
                reference.append(x)

            print("data: ", reference)

            for i in range(len(reference)):
                serializer.validated_data["user_message"] = data["user_input"][i]
                resposta_llm = get_llm_summary_answer_by_cursor_complete(
                    serializer.validated_data, contexto=reference[i]
                )
                data["response"].append(resposta_llm["texto_completo"])
                lista_reference_contexts = []
                for x in resposta_llm["resultado"]:
                    lista_reference_contexts.append(x["source"]["text"])
                data["retrieved_contexts"].append(lista_reference_contexts)

            # Convert the data to a Hugging Face Dataset
            dataset = Dataset.from_dict(data)

            # Define the metrics you want to evaluate
            metrics = [
                faithfulness,
                # answer_relevancy,
                # answer_correctness,
                # context_precision,
                # context_recall,
            ]

            # Evaluate the dataset using the selected metrics
            results = evaluate(dataset, metrics)

            # results.to_pandas().to_csv("./result.csv")
            return Response({"resposta": results.to_pandas().to_string()})
setup/settings.py  CHANGED
@@ -52,6 +52,7 @@ INSTALLED_APPS = [
     "resumos",
     "modelos_usuarios",
     "ragas_api",
+    "gerar_relatorio_modelo_usuario",
 ]

 MIDDLEWARE = [
setup/urls.py  CHANGED
@@ -4,11 +4,11 @@ from rest_framework import routers
 from drf_spectacular.views import SpectacularSwaggerView, SpectacularAPIView


+from gerar_relatorio_modelo_usuario.views import ResumoSimplesCursorCompletoView
 from pdfs.views import getPDF
 from resumos.views import (
     ResumoView,
     ResumoSimplesCursorView,
-    ResumoSimplesCursorCompletoView,
 )
 from ragas_api.views import RagasFromTextView, RagasView
 from modelos_usuarios.views import (

@@ -31,7 +31,7 @@ urlpatterns = [
     path("resumo", ResumoView.as_view(), name="summary-pdf"),
     path("resumo/cursor", ResumoSimplesCursorView.as_view(), name="summary-cursor-pdf"),
     path(
-        "(old route string truncated in this view)
+        "gerar-relatorio",
         ResumoSimplesCursorCompletoView.as_view(),
         name="summary-cursor-completo-pdf",
     ),
|