feat: translate comments, docstrings, and log messages to Spanish.

This commit is contained in:
Marco Gallegos
2025-12-18 12:33:39 -06:00
parent 519a5ad705
commit 3b9346fe0f
12 changed files with 205 additions and 205 deletions

View File

@@ -1,5 +1,5 @@
"""
Configuration loader for providers and keywords.
Cargador de configuración para proveedores y palabras clave.
"""
import csv
import os
@@ -8,43 +8,43 @@ from typing import List, Dict, Any
logger = logging.getLogger(__name__)
# Paths to configuration files
# Rutas a los archivos de configuración
BASE_DIR = os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
PROVIDERS_PATH = os.path.join(BASE_DIR, 'config', 'providers.csv')
KEYWORDS_PATH = os.path.join(BASE_DIR, 'config', 'keywords.csv')
def load_providers() -> List[Dict[str, Any]]:
"""
Loads the providers configuration from CSV.
Carga la configuración de proveedores desde el archivo CSV.
"""
providers = []
if not os.path.exists(PROVIDERS_PATH):
logger.warning(f"Providers file not found at {PROVIDERS_PATH}")
logger.warning(f"Archivo de proveedores no encontrado en {PROVIDERS_PATH}")
return providers
try:
with open(PROVIDERS_PATH, mode='r', encoding='utf-8') as f:
reader = csv.DictReader(f)
for row in reader:
# Process aliases into a list
# Procesar alias en una lista
if 'aliases' in row and row['aliases']:
row['aliases'] = [a.strip().lower() for a in row['aliases'].split(',')]
else:
row['aliases'] = []
providers.append(row)
logger.info(f"Loaded {len(providers)} providers from {PROVIDERS_PATH}")
logger.info(f"Se cargaron {len(providers)} proveedores desde {PROVIDERS_PATH}")
except Exception as e:
logger.error(f"Error loading providers: {e}")
logger.error(f"Error al cargar proveedores: {e}")
return providers
def load_keywords() -> List[Dict[str, Any]]:
"""
Loads the keywords configuration from CSV.
Carga la configuración de palabras clave desde el archivo CSV.
"""
keywords = []
if not os.path.exists(KEYWORDS_PATH):
logger.warning(f"Keywords file not found at {KEYWORDS_PATH}")
logger.warning(f"Archivo de palabras clave no encontrado en {KEYWORDS_PATH}")
return keywords
try:
@@ -54,8 +54,8 @@ def load_keywords() -> List[Dict[str, Any]]:
if 'keyword' in row:
row['keyword'] = row['keyword'].strip().lower()
keywords.append(row)
logger.info(f"Loaded {len(keywords)} keywords from {KEYWORDS_PATH}")
logger.info(f"Se cargaron {len(keywords)} palabras clave desde {KEYWORDS_PATH}")
except Exception as e:
logger.error(f"Error loading keywords: {e}")
logger.error(f"Error al cargar palabras clave: {e}")
return keywords

View File

@@ -1,5 +1,5 @@
"""
Matching logic for providers and keywords.
Lógica de coincidencia para proveedores y palabras clave.
"""
import logging
from typing import Optional, Dict, Any
@@ -7,13 +7,13 @@ from app.preprocessing.config_loader import load_providers, load_keywords
logger = logging.getLogger(__name__)
# Global cache for configuration
# Caché global para la configuración
_PROVIDERS = None
_KEYWORDS = None
def get_config():
"""
Returns the loaded configuration, using cache if available.
Devuelve la configuración cargada, utilizando la caché si está disponible.
"""
global _PROVIDERS, _KEYWORDS
if _PROVIDERS is None:
@@ -24,7 +24,7 @@ def get_config():
def match_provider(description: str) -> Optional[Dict[str, Any]]:
"""
Searches for a provider name or alias in the description.
Busca un nombre de proveedor o alias en la descripción.
"""
providers, _ = get_config()
desc_lower = description.lower()
@@ -33,11 +33,11 @@ def match_provider(description: str) -> Optional[Dict[str, Any]]:
name = p.get('provider_name', '').lower()
aliases = p.get('aliases', [])
# Check name
# Verificar nombre
if name and name in desc_lower:
return p
# Check aliases
# Verificar alias
for alias in aliases:
if alias and alias in desc_lower:
return p
@@ -46,7 +46,7 @@ def match_provider(description: str) -> Optional[Dict[str, Any]]:
def match_keywords(description: str) -> Optional[Dict[str, Any]]:
"""
Searches for keywords in the description.
Busca palabras clave en la descripción.
"""
_, keywords = get_config()
desc_lower = description.lower()
@@ -60,13 +60,13 @@ def match_keywords(description: str) -> Optional[Dict[str, Any]]:
def get_metadata_from_match(description: str) -> Dict[str, Any]:
"""
Attempts to find metadata (category, subcategory, etc.) for a description.
Priority: Provider Match > Keyword Match.
Intenta encontrar metadatos (categoría, subcategoría, etc.) para una descripción.
Prioridad: Coincidencia de Proveedor > Coincidencia de Palabra Clave.
"""
# 1. Try Provider Match
# 1. Intentar coincidencia de proveedor
provider = match_provider(description)
if provider:
logger.info(f"Matched provider: {provider['provider_name']}")
logger.info(f"Proveedor coincidente: {provider['provider_name']}")
return {
"category": provider.get('categoria_principal'),
"subcategory": provider.get('subcategoria'),
@@ -75,10 +75,10 @@ def get_metadata_from_match(description: str) -> Dict[str, Any]:
"matched_name": provider['provider_name']
}
# 2. Try Keyword Match
# 2. Intentar coincidencia de palabra clave
keyword = match_keywords(description)
if keyword:
logger.info(f"Matched keyword: {keyword['keyword']}")
logger.info(f"Palabra clave coincidente: {keyword['keyword']}")
return {
"category": keyword.get('categoria_principal'),
"subcategory": keyword.get('subcategoria'),