Spaces:

DHEIVER
/

Criminal.ai

Running

App Files Community

DHEIVER committed on Dec 27, 2024

Commit

7060ba3

verified ·

1 Parent(s): e6394a7

Update app.py

Browse files

Files changed (1) hide show

app.py +35 -32

app.py CHANGED Viewed

@@ -10,48 +10,51 @@ logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
 class DocumentGenerator:
-    """Gerencia a geração de documentos usando modelo público"""
     def __init__(self):
-        # Usando um Space público que está efetivamente disponível
         self.client = InferenceApi(
-            repo_id="bigscience/bloom",
             token=os.environ.get("HF_TOKEN")
         )
     def generate(self, doc_type: str, context: Dict[str, str]) -> str:
         """Gera o documento usando o modelo"""
         try:
-            prompt = f"""You are a Brazilian criminal lawyer. Create a {doc_type} in Portuguese following Brazilian legal standards.
-Information:
-Client: {context.get('client_name')}
-Process: {context.get('process_number')}
-Court: {context.get('court')}
-Jurisdiction: {context.get('jurisdiction')}
-Facts:
 {context.get('facts')}
-Legal Basis:
 {context.get('legal_basis')}
-Instructions:
-1. Use formal legal Portuguese
-2. Follow Brazilian legal document format
-3. Include all required sections
-4. Be precise and clear
-5. Keep proper legal formatting"""
-            response = self.client(
-                inputs=prompt,
-                parameters={
-                    "max_new_tokens": 2048,
-                    "temperature": 0.3,
-                    "top_p": 0.95,
-                    "repetition_penalty": 1.15,
-                    "do_sample": True
-                }
             )
             return self._format_output(response[0]["generated_text"])
@@ -65,19 +68,19 @@ Instructions:
         if not text:
             return "Erro: Nenhum texto gerado"
-        # Remove o prompt da resposta
-        text = text.split("Instructions:")[-1].strip()
         # Ajusta formatação
         lines = [line.strip() for line in text.split('\n') if line.strip()]
         formatted_text = '\n\n'.join(lines)
-        # Adiciona data atual
-        current_date = datetime.now().strftime('%d de %B de %Y')
         formatted_text = f"{formatted_text}\n\n{context.get('jurisdiction')}, {current_date}"
-        return formatted_text
 class WebInterface:
     """Interface Gradio para o gerador de documentos"""

 logger = logging.getLogger(__name__)
 class DocumentGenerator:
+    """Gerencia a geração de documentos usando BERT-PT"""
     def __init__(self):
+        # Usando modelo BERT português
         self.client = InferenceApi(
+            repo_id="neuralmind/bert-base-portuguese-legal-cased",
             token=os.environ.get("HF_TOKEN")
         )
     def generate(self, doc_type: str, context: Dict[str, str]) -> str:
         """Gera o documento usando o modelo"""
         try:
+            prompt = f"""[DOCUMENTO LEGAL]
+TIPO: {doc_type}
+[QUALIFICAÇÃO]
+CLIENTE: {context.get('client_name')}
+PROCESSO: {context.get('process_number')}
+TRIBUNAL: {context.get('court')}
+COMARCA: {context.get('jurisdiction')}
+[FATOS]
 {context.get('facts')}
+[FUNDAMENTOS]
 {context.get('legal_basis')}
+[INSTRUÇÕES]
+- Use linguagem jurídica formal
+- Siga formato brasileiro
+- Inclua todas as seções necessárias
+- Mantenha clareza e precisão
+- Use formatação adequada
+Gere o documento completo em português:"""
+            # Faz a chamada ao modelo
+            response = self.client.text_generation(
+                prompt,
+                max_new_tokens=1024,
+                do_sample=True,
+                temperature=0.2,
+                top_p=0.95,
+                num_return_sequences=1,
+                repetition_penalty=1.2
             )
             return self._format_output(response[0]["generated_text"])
         if not text:
             return "Erro: Nenhum texto gerado"
+        # Remove o prompt
+        text = text.split("Gere o documento completo em português:")[-1].strip()
         # Ajusta formatação
         lines = [line.strip() for line in text.split('\n') if line.strip()]
         formatted_text = '\n\n'.join(lines)
+        # Adiciona data
+        current_date = datetime.now().strftime('%d de %B de %Y').replace('May', 'Maio').replace('April', 'Abril')
         formatted_text = f"{formatted_text}\n\n{context.get('jurisdiction')}, {current_date}"
+        return formatted_text.strip()
 class WebInterface:
     """Interface Gradio para o gerador de documentos"""