diff --git a/diarios/admin.py b/diarios/admin.py index 96074c4..08af8ce 100644 --- a/diarios/admin.py +++ b/diarios/admin.py @@ -1,18 +1,13 @@ from django.contrib import admin -from .models import PDFDocument, DiarioOficial, TipoDiarioOficial from django.db import models - -@admin.register(PDFDocument) -class PDFDocumentAdmin(admin.ModelAdmin): - pass +from .models import DiarioOficial, TipoDiarioOficial @admin.register(DiarioOficial) class DiarioOficialAdmin(admin.ModelAdmin): pass - @admin.register(TipoDiarioOficial) class TipoDiarioOficialAdmin(admin.ModelAdmin): pass diff --git a/diarios/documents.py b/diarios/documents.py index e4f7fbb..21351a7 100644 --- a/diarios/documents.py +++ b/diarios/documents.py @@ -1,7 +1,9 @@ from django_elasticsearch_dsl import Document, fields from django_elasticsearch_dsl.registries import registry + from .models import DiarioOficial + @registry.register_document class DiarioOficialDocument(Document): tipo = fields.ObjectField(properties={ @@ -46,7 +48,6 @@ class DiarioOficialDocument(Document): 'lei, legislação, norma', 'processo, procedimento, autos', 'contrato, acordo, convênio', - # Adicione mais sinônimos relevantes para o contexto legal ] } }, diff --git a/diarios/migrations/0005_delete_pdfdocument.py b/diarios/migrations/0005_delete_pdfdocument.py new file mode 100644 index 0000000..0e0679e --- /dev/null +++ b/diarios/migrations/0005_delete_pdfdocument.py @@ -0,0 +1,16 @@ +# Generated by Django 5.0.12 on 2025-03-15 15:51 + +from django.db import migrations + + +class Migration(migrations.Migration): + + dependencies = [ + ("diarios", "0004_remove_diariooficial_finalizado_and_more"), + ] + + operations = [ + migrations.DeleteModel( + name="PDFDocument", + ), + ] diff --git a/diarios/models.py b/diarios/models.py index 1d013a4..1bdcfe8 100644 --- a/diarios/models.py +++ b/diarios/models.py @@ -1,43 +1,13 @@ -import requests +import json import os from urllib.parse import urlparse -from django.core.files.base import ContentFile -from django.db import models + import PyPDF2 -import json -from django.core.serializers.json import DjangoJSONEncoder +import requests from babel.dates import format_date - - -class PDFDocument(models.Model): - title = models.CharField(max_length=255) - file = models.FileField(upload_to="pdfs/") - content = models.TextField(blank=True) - uploaded_at = models.DateTimeField(auto_now_add=True) - page_content = models.TextField(blank=True) - - def __str__(self): - return self.title - - def save(self, *args, **kwargs): - if self.file: - pdf = PyPDF2.PdfReader(self.file) - texto = [] - pages_data = [] - - for i, pagina in enumerate(pdf.pages): - page_text = pagina.extract_text() - pages_data.append( - { - "number": i + 1, - "content": page_text, - } - ) - texto.append(pagina.extract_text()) - self.content = "\n".join(texto) - self.page_content = json.dumps(pages_data) - - super().save(*args, **kwargs) +from django.core.files.base import ContentFile +from django.core.serializers.json import DjangoJSONEncoder +from django.db import models class TipoDiarioOficial(models.Model): diff --git a/diarios/templates/diarios/diarios_search.html b/diarios/templates/diarios/diarios_search.html index 956643b..f2e91e6 100644 --- a/diarios/templates/diarios/diarios_search.html +++ b/diarios/templates/diarios/diarios_search.html @@ -3,20 +3,73 @@ {% block content %}