feat: enhance backend security and configuration

- Updated Dockerfile to improve security with a non-root user and added health checks.
- Modified docker-compose.yml to set containers as read-only, restrict ports to localhost, and implement health checks.
- Enhanced .env.example with additional environment variables for security and configuration.
- Improved FastAPI application with middleware for security headers, CORS, and body size limits.
- Refactored authentication flow in auth.py to include state validation and improved error handling.
- Added rate limiting to various endpoints to prevent abuse.
- Updated researcher and publication handling to ensure better validation and error management.
This commit is contained in:
Mireya Cueto Garrido
2026-05-08 11:19:52 +02:00
parent 96e58dbd16
commit af1b8e9956
37 changed files with 1375 additions and 282 deletions
+4
View File
@@ -1,3 +1,7 @@
from sqlalchemy.orm import declarative_base
# ---------------------------------------------------------
# Base de datos
# ---------------------------------------------------------
Base = declarative_base()
+9
View File
@@ -6,6 +6,9 @@ from datetime import datetime
from app.db.session import Base
# ---------------------------------------------------------
# Modelo de investigador
# ---------------------------------------------------------
class Researcher(Base):
__tablename__ = "researchers"
@@ -18,6 +21,9 @@ class Researcher(Base):
publications = relationship("Publication", back_populates="researcher", cascade="all, delete-orphan")
# ---------------------------------------------------------
# Modelo de publicación
# ---------------------------------------------------------
class Publication(Base):
__tablename__ = "publications"
@@ -65,6 +71,9 @@ class Publication(Base):
# Legacy: descargado global (deprecado). Mantener por compatibilidad de DB.
downloaded = Column(Boolean, nullable=False, default=False)
# ---------------------------------------------------------
# Modelo de descarga de publicación
# ---------------------------------------------------------
class PublicationDownload(Base):
"""
@@ -1,8 +1,16 @@
from sqlalchemy.orm import Session
from app.db.models import Publication
# ---------------------------------------------------------
# Repositorio de publicaciones
# ---------------------------------------------------------
class PublicationRepository:
# ---------------------------------------------------------
# Función auxiliar: obtener publicación por put_code
# ---------------------------------------------------------
@staticmethod
def get_by_put_code(db: Session, researcher_id: str, put_code: int):
"""
@@ -17,6 +25,10 @@ class PublicationRepository:
.first()
)
# ---------------------------------------------------------
# Función auxiliar: crear una nueva publicación
# ---------------------------------------------------------
@staticmethod
def create(db: Session, researcher_id: str, data: dict):
"""
@@ -37,6 +49,10 @@ class PublicationRepository:
db.refresh(pub)
return pub
# ---------------------------------------------------------
# Función auxiliar: actualizar una publicación existente
# ---------------------------------------------------------
@staticmethod
def update(db: Session, publication: Publication, data: dict):
"""
@@ -53,6 +69,10 @@ class PublicationRepository:
db.refresh(publication)
return publication
# ---------------------------------------------------------
# Función auxiliar: listar publicaciones de un investigador
# ---------------------------------------------------------
@staticmethod
def list_by_researcher(db: Session, researcher_id: str):
"""
@@ -2,13 +2,24 @@ from sqlalchemy.orm import Session
from app.db.models import Researcher
from sqlalchemy.sql import func
# ---------------------------------------------------------
# Repositorio de investigadores
# ---------------------------------------------------------
class ResearcherRepository:
# ---------------------------------------------------------
# Función auxiliar: obtener investigador por ORCID ID
# ---------------------------------------------------------
@staticmethod
def get_by_orcid(db: Session, orcid_id: str):
    """Look up a researcher by ORCID iD.

    Args:
        db: Session used to run the query.
        orcid_id: Value compared against ``Researcher.orcid_id``.

    Returns:
        The first ``Researcher`` row whose ``orcid_id`` equals the given
        value (``Query.first()`` yields ``None`` when nothing matches).
    """
    # Build the filtered query first, then fetch only the first row.
    matching = db.query(Researcher).filter(Researcher.orcid_id == orcid_id)
    return matching.first()
# ---------------------------------------------------------
# Función auxiliar: crear un nuevo investigador
# ---------------------------------------------------------
@staticmethod
def create(db: Session, orcid_id: str, name: str = None):
researcher = Researcher(orcid_id=orcid_id, name=name)
@@ -17,6 +28,10 @@ class ResearcherRepository:
db.refresh(researcher)
return researcher
# ---------------------------------------------------------
# Función auxiliar: actualizar la última sincronización
# ---------------------------------------------------------
@staticmethod
def update_last_sync(db: Session, researcher: Researcher):
researcher.last_sync_at = func.now()
@@ -2,9 +2,16 @@ from sqlalchemy.orm import Session
from app.db.models import SyncJob
from sqlalchemy.sql import func
# ---------------------------------------------------------
# Repositorio de trabajos de sincronización
# ---------------------------------------------------------
class SyncJobRepository:
# ---------------------------------------------------------
# Función auxiliar: iniciar un nuevo trabajo de sincronización
# ---------------------------------------------------------
@staticmethod
def start_job(db: Session, researcher_id: str):
job = SyncJob(
@@ -17,6 +24,10 @@ class SyncJobRepository:
db.refresh(job)
return job
# ---------------------------------------------------------
# Función auxiliar: finalizar un trabajo de sincronización
# ---------------------------------------------------------
@staticmethod
def finish_job(db: Session, job: SyncJob, new_records: int, updated_records: int):
job.status = "finished"
+10
View File
@@ -9,6 +9,7 @@ load_dotenv()
# -----------------------------
# DATABASE URL
# -----------------------------
DATABASE_URL = os.getenv("DATABASE_URL")
engine = create_engine(
@@ -29,6 +30,7 @@ Base = declarative_base()
# -----------------------------
# DB SESSION DEPENDENCY
# -----------------------------
def get_db():
db = SessionLocal()
try:
@@ -40,17 +42,25 @@ def get_db():
# -----------------------------
# INIT DB (CREA TABLAS)
# -----------------------------
def init_db():
    """Register the models, create missing tables, then run ``_ensure_columns()``."""
    # Import the models so that SQLAlchemy registers them
    import app.db.models  # noqa
    # Create all tables if they do not exist yet
    Base.metadata.create_all(bind=engine)
    # Small "best-effort" migrations for environments without Alembic.
    # (create_all does not alter existing tables)
    _ensure_columns()
# ---------------------------------------------------------
# Función auxiliar: asegurar columnas existentes
# ---------------------------------------------------------
def _ensure_columns():
insp = inspect(engine)