Spaces:
Running
Running
from dataclasses import dataclass, field | |
from typing import List, Optional, Union | |
from rest_framework import serializers | |
from _utils.gerar_documento_utils.prompts import ( | |
prompt_gerar_documento, | |
) | |
from gerar_documento.serializer_base import ( | |
GerarDocumentoParametros, | |
GerarDocumentoParametrosData, | |
) | |
from setup.environment import default_model | |
from django.core.files.uploadedfile import UploadedFile | |
user_message = "What are the main points of this document?" | |
class GerarDocumentoInitialSerializer(serializers.Serializer): | |
files = serializers.ListField(child=serializers.FileField(), required=True) | |
user_message = serializers.CharField(required=False, default=user_message) | |
model = serializers.CharField(required=False, default=default_model) | |
hf_embedding = serializers.CharField(required=False, default="all-MiniLM-L6-v2") | |
chunk_size = serializers.IntegerField(required=False, default=3500) | |
chunk_overlap = serializers.IntegerField(required=False, default=800) | |
prompt_gerar_documento = serializers.CharField( | |
required=False, default=prompt_gerar_documento | |
) | |
prompt_gerar_documento_etapa_2 = serializers.CharField(required=False) | |
prompt_gerar_documento_etapa_3 = serializers.CharField(required=False) | |
model_cohere_rerank = serializers.CharField( | |
required=False, default="rerank-english-v2.0" | |
) | |
claude_context_model = serializers.CharField( | |
required=False, default="claude-3-haiku-20240307" | |
) | |
should_have_contextual_chunks = serializers.BooleanField(default=False) # type: ignore | |
should_use_llama_parse = serializers.BooleanField(required=False, default=False) # type: ignore | |
llm_ultimas_requests = serializers.CharField( | |
required=False, default="gemini-2.0-flash" | |
) | |
class GerarDocumentoInitialSerializerData: | |
files: List[dict] | |
user_message: str = "" | |
model: str = default_model | |
hf_embedding: str = "all-MiniLM-L6-v2" | |
chunk_size: int = 3500 | |
chunk_overlap: int = 800 | |
prompt_gerar_documento: str = "" | |
prompt_gerar_documento_etapa_2: Union[str, None] = None | |
prompt_gerar_documento_etapa_3: Union[str, None] = None | |
model_cohere_rerank: str = "rerank-english-v2.0" | |
claude_context_model: str = "claude-3-haiku-20240307" | |
should_have_contextual_chunks: bool = False | |
should_use_llama_parse: bool = False | |
llm_ultimas_requests: str = "gemini-2.0-flash" | |
class FileInfoSerializer(serializers.Serializer): | |
unique_id = serializers.CharField(max_length=255) | |
tipo_arquivo = serializers.CharField(max_length=255) | |
link_arquivo = serializers.URLField() | |
class FileInfoSerializerData: | |
unique_id: str | |
tipo_arquivo: str | |
link_arquivo: str | |
class GerarDocumentoSerializer( | |
GerarDocumentoInitialSerializer, GerarDocumentoParametros | |
): | |
files = serializers.ListField(child=FileInfoSerializer(), required=True) | |
bubble_editor_version = serializers.CharField( | |
required=False, default="version-test" | |
) # Será o valor utilizado dentro da URL da requisição pro Bubble | |
doc_id = serializers.CharField(required=True) | |
form_response_id = serializers.CharField(required=True) | |
version = serializers.CharField(required=True) | |
def get_obj(self): | |
return GerarDocumentoSerializerData(**self.validated_data) # type: ignore | |
class GerarDocumentoSerializerData( | |
GerarDocumentoParametrosData, GerarDocumentoInitialSerializerData | |
): | |
files: List[FileInfoSerializerData] | |
bubble_editor_version: str = "version-test" | |
doc_id: str = "" | |
form_response_id: str = "" | |
version: str = "" | |
class GerarDocumentoComPDFProprioSerializer( | |
GerarDocumentoInitialSerializer, GerarDocumentoParametros | |
): | |
def get_obj(self): | |
return GerarDocumentoSerializerData(**self.validated_data) # type: ignore | |
class GerarDocumentoComPDFProprioSerializerData( | |
GerarDocumentoParametrosData, GerarDocumentoInitialSerializerData | |
): | |
pass | |
class GerarEmentaSerializer(serializers.Serializer): | |
files = serializers.ListField(child=FileInfoSerializer(), required=True) | |
user_message = serializers.CharField(required=False, default="") | |
chunk_size = serializers.IntegerField(required=False, default=3500) | |
chunk_overlap = serializers.IntegerField(required=False, default=800) | |
bubble_editor_version = serializers.CharField( | |
required=False, default="version-test" | |
) # Será o valor utilizado dentro da URL da requisição pro Bubble | |
doc_id = serializers.CharField(required=True) | |
form_response_id = serializers.CharField(required=True) | |
version = serializers.CharField(required=True) | |