feat: AR-House initial commit

This commit is contained in:
2026-07-03 12:24:58 -04:00
commit 047c05287a
216 changed files with 127552 additions and 0 deletions
+13
View File
@@ -0,0 +1,13 @@
"""AR-House Location Intelligence Agent.
Investiga una dirección y genera un reporte completo de inteligencia de
ubicación para decisiones de inversión inmobiliaria.
Uso rápido:
from location_agent import run_location_agent
result = run_location_agent("1234 W 49th St, Hialeah FL 33012")
"""
from .agent import LocationAgent, run_location_agent
__all__ = ["LocationAgent", "run_location_agent"]
+195
View File
@@ -0,0 +1,195 @@
"""LocationAgent — Orquestador principal.
Flujo:
1. Geocode (Census → Nominatim fallback)
2. 7 sub-agentes en paralelo (ThreadPoolExecutor)
3. Calcular scores parciales y score general
4. Síntesis narrativa via Ollama
5. Guardar en SQLite
6. Exportar PDF
Uso:
from location_agent import run_location_agent
result = run_location_agent("1234 W 49th St, Hialeah FL 33012",
status_cb=print)
"""
from __future__ import annotations
import time
from concurrent.futures import ThreadPoolExecutor, as_completed
from typing import Callable, Optional
from .utils.geocoder import geocode
from .utils import ollama_client
from .sub_agents import (
crime_agent,
property_agent,
schools_agent,
amenities_agent,
demographics_agent,
maritime_agent,
lifestyle_agent,
)
from .report.report_generator import build_report
from .report.pdf_generator import export_pdf
from .db import save_report
SCORE_WEIGHTS = {
"crime": 0.20,
"property": 0.20,
"schools": 0.10,
"amenities": 0.15,
"demographics": 0.10,
"maritime": 0.15,
"lifestyle": 0.10,
}
def _emit(cb: Optional[Callable], msg: str) -> None:
if cb:
cb(msg)
class LocationAgent:
def __init__(self, status_cb: Optional[Callable[[str], None]] = None):
self.status_cb = status_cb
def analyze(self, address: str) -> dict:
"""Ejecuta el análisis completo para una dirección."""
t0 = time.perf_counter()
_emit(self.status_cb, f"🔍 Geocodificando: {address}")
# 1. Geocode
try:
geo = geocode(address)
except ValueError as e:
return {"error": str(e), "address": address}
lat = geo["lat"]
lon = geo["lon"]
_emit(self.status_cb, f"{geo['address']} | {geo['county']}, {geo['state']} | ({lat:.4f}, {lon:.4f})")
# 2. Sub-agentes en paralelo
_emit(self.status_cb, "🔄 Ejecutando sub-agentes en paralelo...")
sub_results = self._run_sub_agents(lat, lon, geo)
# 3. Calcular scores
scores = self._calculate_scores(sub_results)
overall = self._overall_score(scores)
_emit(self.status_cb, f" 📊 Score general: {overall}/100")
# 4. Síntesis Ollama
_emit(self.status_cb, "🤖 Generando análisis narrativo (Ollama)...")
narratives = self._build_narratives(sub_results, geo["address"])
exec_summary = ollama_client.executive_summary(scores, geo["address"], overall)
# 5. Construir reporte completo
report = build_report(
geo=geo,
sub_results=sub_results,
scores=scores,
overall_score=overall,
narratives=narratives,
exec_summary=exec_summary,
)
# 6. Guardar en SQLite
try:
report_id = save_report(geo, scores, overall, sub_results, report)
report["report_id"] = report_id
_emit(self.status_cb, f" 💾 Guardado en BD (id={report_id})")
except Exception as e:
_emit(self.status_cb, f" ⚠️ Error guardando en BD: {e}")
# 7. Exportar PDF
try:
pdf_path = export_pdf(report)
report["pdf_path"] = str(pdf_path)
_emit(self.status_cb, f" 📄 PDF: {pdf_path}")
except Exception as e:
_emit(self.status_cb, f" ⚠️ Error generando PDF: {e}")
report["pdf_path"] = None
report["duration_seconds"] = round(time.perf_counter() - t0, 2)
_emit(self.status_cb, f"✅ Análisis completo en {report['duration_seconds']}s")
return report
def _run_sub_agents(self, lat: float, lon: float, geo: dict) -> dict:
address = geo["address"]
county = geo.get("county", "")
state = geo.get("state", "FL")
tract = geo.get("tract_geoid", "")
state_fips = geo.get("state_fips", "")
county_fips = geo.get("county_fips", "")
tasks = {
"crime": lambda: crime_agent.run(lat, lon, address),
"property": lambda: property_agent.run(lat, lon, address, county),
"schools": lambda: schools_agent.run(lat, lon, address),
"amenities": lambda: amenities_agent.run(lat, lon, address),
"demographics": lambda: demographics_agent.run(
lat, lon, address, tract, state_fips, county_fips),
"maritime": lambda: maritime_agent.run(lat, lon, address, state),
"lifestyle": lambda: lifestyle_agent.run(lat, lon, address),
}
results = {}
with ThreadPoolExecutor(max_workers=7) as ex:
futures = {ex.submit(fn): name for name, fn in tasks.items()}
for future in as_completed(futures):
name = futures[future]
try:
results[name] = future.result()
_emit(self.status_cb, f"{name}")
except Exception as e:
results[name] = {"errors": [str(e)]}
_emit(self.status_cb, f" ⚠️ {name}: {e}")
return results
def _calculate_scores(self, sub_results: dict) -> dict:
score_fns = {
"crime": crime_agent.score,
"property": property_agent.score,
"schools": schools_agent.score,
"amenities": amenities_agent.score,
"demographics": demographics_agent.score,
"maritime": maritime_agent.score,
"lifestyle": lifestyle_agent.score,
}
scores = {}
for name, fn in score_fns.items():
try:
scores[name] = fn(sub_results.get(name, {}))
except Exception:
scores[name] = 50
return scores
def _overall_score(self, scores: dict) -> int:
total = sum(scores.get(k, 50) * w for k, w in SCORE_WEIGHTS.items())
return round(total)
def _build_narratives(self, sub_results: dict, address: str) -> dict:
section_names = {
"crime": "criminalidad",
"property": "valoración inmobiliaria",
"schools": "escuelas",
"amenities": "amenities y walkability",
"demographics": "demografía",
"maritime": "mercado laboral marítimo",
"lifestyle": "estilo de vida náutico",
}
narratives = {}
for key, section in section_names.items():
data = sub_results.get(key, {})
narratives[key] = ollama_client.analyze_section(data, section, address)
return narratives
def run_location_agent(
address: str,
status_cb: Optional[Callable[[str], None]] = None,
) -> dict:
"""Función de conveniencia para ejecutar el agente."""
return LocationAgent(status_cb=status_cb).analyze(address)
+119
View File
@@ -0,0 +1,119 @@
"""Persistencia SQLite para location_agent.
Usa ar_house.db existente del proyecto.
Crea la tabla location_reports si no existe.
"""
from __future__ import annotations
import json
import sqlite3
from pathlib import Path
_PROJECT_ROOT = Path(__file__).resolve().parent.parent
DB_PATH = _PROJECT_ROOT / "ar_house.db"
CREATE_SQL = """
CREATE TABLE IF NOT EXISTS location_reports (
id INTEGER PRIMARY KEY AUTOINCREMENT,
address TEXT NOT NULL,
lat REAL,
lon REAL,
score_general INTEGER,
score_crime INTEGER,
score_property INTEGER,
score_schools INTEGER,
score_amenities INTEGER,
score_demographics INTEGER,
score_maritime INTEGER,
score_lifestyle INTEGER,
raw_data TEXT,
report_text TEXT,
pdf_path TEXT,
created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP
);
"""
def _conn() -> sqlite3.Connection:
conn = sqlite3.connect(DB_PATH)
conn.row_factory = sqlite3.Row
return conn
def init_db() -> None:
"""Crea la tabla si no existe."""
with _conn() as conn:
conn.execute(CREATE_SQL)
conn.commit()
def save_report(
geo: dict,
scores: dict,
overall_score: int,
raw_data: dict,
report: dict,
) -> int:
"""Guarda el reporte en SQLite. Devuelve el ID insertado."""
init_db()
pdf_path = report.get("pdf_path")
with _conn() as conn:
cur = conn.execute(
"""
INSERT INTO location_reports
(address, lat, lon, score_general,
score_crime, score_property, score_schools, score_amenities,
score_demographics, score_maritime, score_lifestyle,
raw_data, report_text, pdf_path)
VALUES (?,?,?,?,?,?,?,?,?,?,?,?,?,?)
""",
(
geo.get("address", ""),
geo.get("lat"),
geo.get("lon"),
overall_score,
scores.get("crime"),
scores.get("property"),
scores.get("schools"),
scores.get("amenities"),
scores.get("demographics"),
scores.get("maritime"),
scores.get("lifestyle"),
json.dumps(raw_data, ensure_ascii=False),
report.get("report_text", ""),
str(pdf_path) if pdf_path else None,
),
)
conn.commit()
return cur.lastrowid
def list_reports(limit: int = 50) -> list[dict]:
"""Lista los últimos reportes guardados."""
init_db()
with _conn() as conn:
rows = conn.execute(
"""SELECT id, address, score_general, created_at
FROM location_reports ORDER BY created_at DESC LIMIT ?""",
(limit,),
).fetchall()
return [dict(r) for r in rows]
def get_report(report_id: int) -> dict | None:
"""Obtiene un reporte completo por ID."""
init_db()
with _conn() as conn:
row = conn.execute(
"SELECT * FROM location_reports WHERE id=?", (report_id,)
).fetchone()
if not row:
return None
d = dict(row)
try:
d["raw_data"] = json.loads(d["raw_data"] or "{}")
except Exception:
pass
return d
+1
View File
@@ -0,0 +1 @@
"""Generadores de reporte para location_agent."""
+355
View File
@@ -0,0 +1,355 @@
"""Generador de PDF para location_agent.
Usa reportlab para generar PDF profesional.
Guarda en: analyses/location_reports/<fecha>_<dirección>.pdf
"""
from __future__ import annotations
import re
from datetime import datetime
from pathlib import Path
_PROJECT_ROOT = Path(__file__).resolve().parent.parent.parent
PDF_DIR = _PROJECT_ROOT / "analyses" / "location_reports"
def export_pdf(report: dict) -> Path:
"""Genera el PDF del reporte. Devuelve la ruta del archivo."""
try:
from reportlab.lib.pagesizes import letter
from reportlab.lib.styles import getSampleStyleSheet, ParagraphStyle
from reportlab.lib.units import inch
from reportlab.lib import colors
from reportlab.platypus import (
SimpleDocTemplate, Paragraph, Spacer, Table, TableStyle,
HRFlowable, PageBreak,
)
from reportlab.lib.enums import TA_CENTER, TA_LEFT
except ImportError:
raise ImportError("Instalar reportlab: pip install reportlab")
PDF_DIR.mkdir(parents=True, exist_ok=True)
# Nombre del archivo
safe_addr = re.sub(r"[^\w\s-]", "", report.get("address", "report"))[:60]
safe_addr = re.sub(r"\s+", "_", safe_addr.strip())
date_str = datetime.now().strftime("%Y%m%d_%H%M%S")
filename = PDF_DIR / f"{date_str}_{safe_addr}.pdf"
doc = SimpleDocTemplate(
str(filename),
pagesize=letter,
rightMargin=0.75 * inch,
leftMargin=0.75 * inch,
topMargin=0.75 * inch,
bottomMargin=0.75 * inch,
)
styles = getSampleStyleSheet()
# Estilos personalizados
title_style = ParagraphStyle("ARTitle", parent=styles["Title"],
fontSize=20, textColor=colors.HexColor("#1a2744"),
spaceAfter=6)
h1_style = ParagraphStyle("ARH1", parent=styles["Heading1"],
fontSize=14, textColor=colors.HexColor("#1a2744"),
spaceBefore=12, spaceAfter=6)
h2_style = ParagraphStyle("ARH2", parent=styles["Heading2"],
fontSize=11, textColor=colors.HexColor("#2d5a8e"))
body_style = ParagraphStyle("ARBody", parent=styles["Normal"],
fontSize=9, leading=13)
score_style = ParagraphStyle("ARScore", parent=styles["Normal"],
fontSize=28, textColor=colors.HexColor("#1a2744"),
alignment=TA_CENTER, fontName="Helvetica-Bold")
caption_style = ParagraphStyle("ARCaption", parent=styles["Normal"],
fontSize=8, textColor=colors.grey)
story = []
# --- PORTADA ---
story.append(Spacer(1, 0.5 * inch))
story.append(Paragraph("AR-HOUSE", title_style))
story.append(Paragraph("Location Intelligence Report", styles["Heading2"]))
story.append(HRFlowable(width="100%", thickness=2, color=colors.HexColor("#1a2744")))
story.append(Spacer(1, 0.2 * inch))
story.append(Paragraph(report.get("address", ""), h1_style))
story.append(Paragraph(f"Análisis: {report.get('analysis_date', '')}", caption_style))
story.append(Spacer(1, 0.3 * inch))
# Score general grande
overall = report.get("overall_score", 0)
score_color = _score_color(overall)
story.append(Paragraph(
f'<font color="{score_color}">{overall}/100</font>',
score_style,
))
story.append(Paragraph("Score General de Ubicación", styles["Normal"]))
story.append(Spacer(1, 0.3 * inch))
# Tabla de scores parciales
scores = report.get("scores", {})
score_labels = {
"crime": "Criminalidad",
"property": "Mercado Inmobiliario",
"schools": "Escuelas",
"amenities": "Amenities",
"demographics": "Demografía",
"maritime": "Mercado Marítimo",
"lifestyle": "Lifestyle Náutico",
}
tdata = [["Dimensión", "Score", "Peso"]]
for k, label in score_labels.items():
s = scores.get(k, 0)
w = int({"crime": 20, "property": 20, "schools": 10, "amenities": 15,
"demographics": 10, "maritime": 15, "lifestyle": 10}.get(k, 0))
tdata.append([label, f"{s}/100", f"{w}%"])
t = Table(tdata, colWidths=[3 * inch, 1.2 * inch, 0.8 * inch])
t.setStyle(TableStyle([
("BACKGROUND", (0, 0), (-1, 0), colors.HexColor("#1a2744")),
("TEXTCOLOR", (0, 0), (-1, 0), colors.white),
("FONTNAME", (0, 0), (-1, 0), "Helvetica-Bold"),
("FONTSIZE", (0, 0), (-1, -1), 9),
("ALIGN", (1, 0), (-1, -1), "CENTER"),
("ROWBACKGROUNDS", (0, 1), (-1, -1), [colors.white, colors.HexColor("#f5f7fa")]),
("GRID", (0, 0), (-1, -1), 0.5, colors.HexColor("#d0d0d0")),
("BOTTOMPADDING", (0, 0), (-1, -1), 5),
("TOPPADDING", (0, 0), (-1, -1), 5),
]))
story.append(t)
story.append(PageBreak())
# --- RESUMEN EJECUTIVO ---
exec_sec = report.get("sections", {}).get("executive", {})
story.append(Paragraph("1. Resumen Ejecutivo", h1_style))
story.append(HRFlowable(width="100%", thickness=1, color=colors.HexColor("#d0d0d0")))
if exec_sec.get("summary"):
story.append(Paragraph(exec_sec["summary"], body_style))
story.append(Spacer(1, 0.15 * inch))
if exec_sec.get("strengths"):
story.append(Paragraph("✅ Principales Fortalezas:", h2_style))
for s in exec_sec["strengths"]:
story.append(Paragraph(f"{s}", body_style))
if exec_sec.get("weaknesses"):
story.append(Spacer(1, 0.1 * inch))
story.append(Paragraph("⚠️ Principales Riesgos:", h2_style))
for w in exec_sec["weaknesses"]:
story.append(Paragraph(f"{w}", body_style))
story.append(PageBreak())
# --- SECCIONES ---
section_order = ["crime", "property", "schools", "amenities",
"demographics", "maritime", "lifestyle"]
section_nums = {k: i+2 for i, k in enumerate(section_order)}
for key in section_order:
sec = report.get("sections", {}).get(key, {})
num = section_nums[key]
score_val = sec.get("score", 0)
title = sec.get("title", key.title())
story.append(Paragraph(f"{num}. {title}", h1_style))
story.append(HRFlowable(width="100%", thickness=1, color=colors.HexColor("#d0d0d0")))
sc = sec.get("score")
if sc is not None:
clr = _score_color(sc)
story.append(Paragraph(
f'Score: <font color="{clr}"><b>{sc}/100</b></font>', body_style
))
# Datos clave por sección
_add_section_data(story, key, sec, body_style, h2_style)
# Narrativa
if sec.get("narrative"):
story.append(Spacer(1, 0.1 * inch))
story.append(Paragraph("Análisis:", h2_style))
story.append(Paragraph(sec["narrative"], body_style))
# Fuentes y errores
if sec.get("sources"):
story.append(Spacer(1, 0.05 * inch))
story.append(Paragraph(
f"<i>Fuentes: {', '.join(sec['sources'])}</i>", caption_style
))
if sec.get("errors"):
for err in sec["errors"]:
story.append(Paragraph(f"<i>⚠ {err}</i>", caption_style))
story.append(PageBreak())
# --- PIE DE PÁGINA ---
story.append(Paragraph("Datos Técnicos", h1_style))
story.append(Paragraph(
f"Generado por AR-House Location Intelligence Agent | {report.get('analysis_date', '')} | "
f"Coordenadas: {report.get('lat', '')}, {report.get('lon', '')}",
caption_style,
))
doc.build(story)
return filename
def _score_color(score: int) -> str:
if score >= 75:
return "#1a7a1a" # verde
elif score >= 50:
return "#e6a817" # amarillo
else:
return "#b83232" # rojo
def _add_section_data(story, key: str, sec: dict, body_style, h2_style) -> None:
"""Agrega datos específicos de cada sección al story del PDF."""
from reportlab.platypus import Paragraph, Spacer, Table, TableStyle
from reportlab.lib import colors
story.append(Spacer(1, 0.1 * inch if True else 0))
if key == "crime":
total = sec.get("total_crimes_30d", "N/A")
violent = "" if sec.get("has_violent") else "No"
story.append(Paragraph(f"Crímenes últimos 30 días: <b>{total}</b>", body_style))
story.append(Paragraph(f"Presencia de crimen violento: <b>{violent}</b>", body_style))
types = sec.get("crime_types", {})
if types:
story.append(Paragraph("Tipos de crimen:", h2_style))
for t, count in list(types.items())[:8]:
story.append(Paragraph(f"{t}: {count}", body_style))
elif key == "property":
fields = [
("Precio mediano listado", "median_list_price", "$"),
("Precio por sqft", "price_per_sqft", "$/sqft"),
("Apreciación 1 año", "appreciation_1y", "%"),
("Días en mercado (prom.)", "days_on_market", " días"),
("Inventario activo", "inventory", " propiedades"),
("Valor tasado condado", "county_assessed_value", "$"),
]
for label, field, unit in fields:
val = sec.get(field)
if val is not None:
if unit == "$":
display = f"${val:,}"
elif unit == "$/sqft":
display = f"${val:,}/sqft"
else:
display = f"{val}{unit}"
story.append(Paragraph(f"{label}: <b>{display}</b>", body_style))
elif key == "schools":
avg = sec.get("avg_rating")
if avg is not None:
story.append(Paragraph(f"Rating promedio de escuelas: <b>{avg}/10</b>", body_style))
for level, label in [("best_elementary", "Mejor primaria"),
("best_middle", "Mejor middle school"),
("best_high", "Mejor high school")]:
school = sec.get(level)
if school:
story.append(Paragraph(
f"{label}: <b>{school.get('name', 'N/A')}</b> (rating: {school.get('rating', 'N/A')}/10)",
body_style,
))
schools = sec.get("schools", [])[:8]
if schools:
tdata = [["Escuela", "Nivel", "Rating"]]
for s in schools:
tdata.append([s.get("name", "")[:35], s.get("level", ""), str(s.get("rating", "N/A"))])
t = Table(tdata, colWidths=[3.2 * inch, 1.2 * inch, 0.8 * inch])
t.setStyle(TableStyle([
("FONTNAME", (0, 0), (-1, 0), "Helvetica-Bold"),
("FONTSIZE", (0, 0), (-1, -1), 8),
("GRID", (0, 0), (-1, -1), 0.5, colors.HexColor("#d0d0d0")),
("ROWBACKGROUNDS", (0, 1), (-1, -1), [colors.white, colors.HexColor("#f5f7fa")]),
]))
story.append(t)
elif key == "amenities":
ws = sec.get("walk_score")
if ws is not None:
story.append(Paragraph(f"Walk Score estimado: <b>{ws}/100</b>", body_style))
nearest = sec.get("nearest", {})
cat_labels = {
"supermarket": "Supermercado más cercano",
"hospital": "Hospital/clínica más cercano",
"restaurant": "Restaurante más cercano",
"park": "Parque más cercano",
"gym": "Gimnasio más cercano",
}
for cat, label in cat_labels.items():
item = nearest.get(cat)
if item:
story.append(Paragraph(
f"{label}: <b>{item.get('name', 'N/A')}</b> ({item.get('dist_miles', '?')} mi)",
body_style,
))
elif key == "demographics":
income = sec.get("median_household_income")
if income:
story.append(Paragraph(f"Ingreso mediano del hogar: <b>${income:,}/año</b>", body_style))
age = sec.get("median_age")
if age:
story.append(Paragraph(f"Edad mediana: <b>{age} años</b>", body_style))
unemp = sec.get("unemployment_rate")
if unemp is not None:
story.append(Paragraph(f"Tasa de desempleo: <b>{unemp}%</b>", body_style))
edu = sec.get("education_bachelors_pct")
if edu is not None:
story.append(Paragraph(f"Con título universitario: <b>{edu}%</b>", body_style))
pop = sec.get("total_population")
if pop:
story.append(Paragraph(f"Población total del área: <b>{pop:,}</b>", body_style))
eth = sec.get("ethnicity", {})
if eth:
story.append(Paragraph("Distribución étnica:", h2_style))
for k, v in eth.items():
label = k.replace("_pct", "").replace("_", " ").title()
story.append(Paragraph(f"{label}: {v}%", body_style))
elif key == "maritime":
shipyards = sec.get("shipyards", [])
marinas = sec.get("marinas_with_jobs", [])
employers = sec.get("maritime_employers", [])
story.append(Paragraph(f"Astilleros encontrados: <b>{len(shipyards)}</b>", body_style))
story.append(Paragraph(f"Marinas encontradas: <b>{len(marinas)}</b>", body_style))
story.append(Paragraph(f"Empleadores portuarios: <b>{len(employers)}</b>", body_style))
bls = sec.get("bls_employment", {})
if bls.get("latest_employment"):
story.append(Paragraph(
f"Empleo marítimo en el estado: <b>{bls['latest_employment']}K empleados</b> "
f"({bls.get('year', '')})",
body_style,
))
elif key == "lifestyle":
nm = sec.get("nearest_marina")
if nm:
story.append(Paragraph(
f"Marina más cercana: <b>{nm.get('name', 'N/A')}</b> ({nm.get('dist_miles', '?')} mi)",
body_style,
))
nb = sec.get("nearest_beach")
if nb:
story.append(Paragraph(
f"Playa más cercana: <b>{nb.get('name', 'N/A')}</b> ({nb.get('dist_miles', '?')} mi)",
body_style,
))
story.append(Paragraph(
f"Acceso oceánico: <b>{'' if sec.get('ocean_access') else 'No'}</b>", body_style
))
story.append(Paragraph(
f"Vías fluviales cercanas: <b>{'' if sec.get('waterway_nearby') else 'No'}</b>",
body_style,
))
story.append(Paragraph(
f"Boat ramps en 10 millas: <b>{len(sec.get('boat_ramps', []))}</b>", body_style
))
from reportlab.lib.units import inch
story.append(Spacer(1, 0.1 * inch))
+167
View File
@@ -0,0 +1,167 @@
"""Generador del reporte de texto completo."""
from __future__ import annotations
from datetime import datetime
def build_report(
geo: dict,
sub_results: dict,
scores: dict,
overall_score: int,
narratives: dict,
exec_summary: dict,
) -> dict:
"""Construye el dict completo del reporte con todas las secciones."""
now = datetime.now()
report = {
"address": geo.get("address", ""),
"lat": geo.get("lat"),
"lon": geo.get("lon"),
"analysis_date": now.strftime("%Y-%m-%d %H:%M"),
"overall_score": overall_score,
"scores": scores,
"sections": {},
"exec_summary": exec_summary,
}
# Sección 1: Resumen ejecutivo (construido arriba)
report["sections"]["executive"] = {
"title": "Resumen Ejecutivo",
"score": overall_score,
"summary": exec_summary.get("summary", ""),
"strengths": exec_summary.get("strengths", []),
"weaknesses": exec_summary.get("weaknesses", []),
}
# Sección 2: Criminalidad
crime_data = sub_results.get("crime", {})
report["sections"]["crime"] = {
"title": "Criminalidad",
"score": scores.get("crime", 0),
"total_crimes_30d": crime_data.get("score_input", {}).get("total_crimes_30d", "N/A"),
"crime_types": crime_data.get("crime_types", {}),
"has_violent": crime_data.get("score_input", {}).get("has_violent", False),
"sources": crime_data.get("sources", []),
"errors": crime_data.get("errors", []),
"narrative": narratives.get("crime", ""),
}
# Sección 3: Valoración inmobiliaria
prop_data = sub_results.get("property", {})
report["sections"]["property"] = {
"title": "Valoración y Mercado Inmobiliario",
"score": scores.get("property", 0),
"estimated_value": prop_data.get("estimated_value"),
"price_per_sqft": prop_data.get("price_per_sqft"),
"appreciation_1y": prop_data.get("appreciation_1y"),
"appreciation_3y": prop_data.get("appreciation_3y"),
"days_on_market": prop_data.get("days_on_market"),
"median_list_price": prop_data.get("median_list_price"),
"inventory": prop_data.get("inventory"),
"county_assessed_value": prop_data.get("county_assessed_value"),
"sources": prop_data.get("sources", []),
"errors": prop_data.get("errors", []),
"narrative": narratives.get("property", ""),
}
# Sección 4: Escuelas
school_data = sub_results.get("schools", {})
report["sections"]["schools"] = {
"title": "Escuelas",
"score": scores.get("schools", 0),
"avg_rating": school_data.get("avg_rating"),
"schools": school_data.get("schools", []),
"best_elementary": school_data.get("best_elementary"),
"best_middle": school_data.get("best_middle"),
"best_high": school_data.get("best_high"),
"sources": school_data.get("sources", []),
"errors": school_data.get("errors", []),
"narrative": narratives.get("schools", ""),
}
# Sección 5: Amenities
amenity_data = sub_results.get("amenities", {})
report["sections"]["amenities"] = {
"title": "Amenities y Walkability",
"score": scores.get("amenities", 0),
"walk_score": amenity_data.get("walk_score_estimate"),
"total_amenities": amenity_data.get("total_amenities", 0),
"categories": amenity_data.get("categories", {}),
"nearest": amenity_data.get("nearest", {}),
"sources": amenity_data.get("sources", []),
"errors": amenity_data.get("errors", []),
"narrative": narratives.get("amenities", ""),
}
# Sección 6: Demografía
demo_data = sub_results.get("demographics", {})
report["sections"]["demographics"] = {
"title": "Demografía",
"score": scores.get("demographics", 0),
"median_household_income": demo_data.get("median_household_income"),
"median_age": demo_data.get("median_age"),
"unemployment_rate": demo_data.get("unemployment_rate"),
"education_bachelors_pct": demo_data.get("education_bachelors_pct"),
"ethnicity": demo_data.get("ethnicity", {}),
"total_population": demo_data.get("total_population"),
"sources": demo_data.get("sources", []),
"errors": demo_data.get("errors", []),
"narrative": narratives.get("demographics", ""),
}
# Sección 7: Mercado marítimo
maritime_data = sub_results.get("maritime", {})
report["sections"]["maritime"] = {
"title": "Mercado Laboral Marítimo",
"score": scores.get("maritime", 0),
"shipyards": maritime_data.get("shipyards", []),
"marinas_with_jobs": maritime_data.get("marinas_with_jobs", []),
"maritime_employers": maritime_data.get("maritime_employers", []),
"bls_employment": maritime_data.get("bls_employment", {}),
"sources": maritime_data.get("sources", []),
"errors": maritime_data.get("errors", []),
"narrative": narratives.get("maritime", ""),
}
# Sección 8: Lifestyle náutico
life_data = sub_results.get("lifestyle", {})
report["sections"]["lifestyle"] = {
"title": "Estilo de Vida Náutico",
"score": scores.get("lifestyle", 0),
"marinas": life_data.get("marinas", []),
"boat_ramps": life_data.get("boat_ramps", []),
"beaches": life_data.get("beaches", []),
"nearest_marina": life_data.get("nearest_marina"),
"nearest_beach": life_data.get("nearest_beach"),
"ocean_access": life_data.get("ocean_access", False),
"waterway_nearby": life_data.get("waterway_nearby", False),
"sources": life_data.get("sources", []),
"errors": life_data.get("errors", []),
"narrative": narratives.get("lifestyle", ""),
}
# Texto plano del reporte para guardar en BD
report["report_text"] = _build_text(report)
return report
def _build_text(report: dict) -> str:
lines = [
f"AR-HOUSE LOCATION INTELLIGENCE REPORT",
f"Dirección: {report['address']}",
f"Fecha: {report['analysis_date']}",
f"Score General: {report['overall_score']}/100",
"",
]
for key, sec in report["sections"].items():
lines.append(f"=== {sec['title'].upper()} ===")
if sec.get("score") is not None:
lines.append(f"Score: {sec['score']}/100")
if sec.get("narrative"):
lines.append(sec["narrative"])
lines.append("")
return "\n".join(lines)
+1
View File
@@ -0,0 +1 @@
"""Scrapers específicos para el módulo location_agent."""
+1
View File
@@ -0,0 +1 @@
"""Sub-agentes de investigación de ubicación."""
@@ -0,0 +1,158 @@
"""Sub-agente: Amenities y walkability.
Fuente: Overpass API (OpenStreetMap) — gratuita, sin key requerida.
"""
from __future__ import annotations
import math
import time
import requests
from data_fetchers.base import USER_AGENT
OVERPASS_URL = "https://overpass-api.de/api/interpreter"
CATEGORIES = {
"supermarket": ["supermarket", "grocery"],
"hospital": ["hospital", "clinic", "doctors", "pharmacy"],
"restaurant": ["restaurant", "fast_food", "cafe"],
"park": ["park"],
"gym": ["fitness_centre", "sports_centre"],
"school": ["school", "kindergarten"],
"bank": ["bank", "atm"],
"gas_station": ["fuel"],
}
def run(lat: float, lon: float, address: str) -> dict:
result = {
"categories": {},
"nearest": {},
"walk_score_estimate": None,
"total_amenities": 0,
"sources": ["OpenStreetMap/Overpass"],
"errors": [],
}
try:
amenities = _overpass_amenities(lat, lon)
result["categories"] = amenities["by_category"]
result["nearest"] = amenities["nearest"]
result["total_amenities"] = amenities["total"]
# Walk score estimado (basado en densidad de amenities en 1 milla)
result["walk_score_estimate"] = _estimate_walk_score(amenities)
except Exception as e:
result["errors"].append(f"Overpass amenities: {e}")
return result
def _overpass_amenities(lat: float, lon: float, radius_m: int = 3200) -> dict:
"""Consulta Overpass API para amenities en radio de ~2 millas."""
amenity_values = "|".join(
v for values in CATEGORIES.values() for v in values
)
query = f"""
[out:json][timeout:30];
(
node["amenity"~"{amenity_values}"](around:{radius_m},{lat},{lon});
);
out body;
"""
time.sleep(1)
r = requests.post(OVERPASS_URL, data={"data": query},
headers={"User-Agent": USER_AGENT}, timeout=35)
r.raise_for_status()
elements = r.json().get("elements", [])
by_category: dict = {cat: [] for cat in CATEGORIES}
nearest: dict = {}
for el in elements:
tags = el.get("tags", {})
amenity = tags.get("amenity", "")
name = tags.get("name", amenity)
el_lat = el.get("lat", lat)
el_lon = el.get("lon", lon)
dist = _haversine(lat, lon, el_lat, el_lon)
for cat, values in CATEGORIES.items():
if amenity in values:
by_category[cat].append({"name": name, "dist_miles": round(dist, 2)})
if cat not in nearest or dist < nearest[cat]["dist_miles"]:
nearest[cat] = {"name": name, "dist_miles": round(dist, 2)}
break
# Ordenar por distancia
for cat in by_category:
by_category[cat].sort(key=lambda x: x["dist_miles"])
by_category[cat] = by_category[cat][:5]
total = sum(len(v) for v in by_category.values())
return {"by_category": by_category, "nearest": nearest, "total": total}
def _haversine(lat1: float, lon1: float, lat2: float, lon2: float) -> float:
"""Distancia en millas entre dos coordenadas."""
R = 3958.8 # radio Tierra en millas
dlat = math.radians(lat2 - lat1)
dlon = math.radians(lon2 - lon1)
a = math.sin(dlat/2)**2 + math.cos(math.radians(lat1)) * math.cos(math.radians(lat2)) * math.sin(dlon/2)**2
return R * 2 * math.asin(math.sqrt(a))
def _estimate_walk_score(amenities: dict) -> int:
"""Estima walk score 0-100 basado en densidad y diversidad de amenities."""
cats = amenities["by_category"]
nearest = amenities["nearest"]
score = 0
# Puntos por cercanía de supermercado (más importante)
sup = nearest.get("supermarket", {}).get("dist_miles", 99)
if sup <= 0.25:
score += 25
elif sup <= 0.5:
score += 18
elif sup <= 1.0:
score += 10
elif sup <= 2.0:
score += 5
# Restaurantes/cafes cercanos
rest_count = len([x for x in cats.get("restaurant", []) if x["dist_miles"] <= 1.0])
score += min(20, rest_count * 3)
# Diversidad de categorías con algo en <= 1 milla
cats_nearby = sum(
1 for cat, items in cats.items()
if any(x["dist_miles"] <= 1.0 for x in items)
)
score += cats_nearby * 5
# Hospitales
hosp = nearest.get("hospital", {}).get("dist_miles", 99)
if hosp <= 2.0:
score += 10
return min(100, max(0, score))
def score(data: dict) -> int:
"""Score 0-100 de amenities."""
ws = data.get("walk_score_estimate")
if ws is not None:
return ws
total = data.get("total_amenities", 0)
if total >= 50:
return 85
elif total >= 30:
return 70
elif total >= 15:
return 55
elif total >= 5:
return 40
return 25
+124
View File
@@ -0,0 +1,124 @@
"""Sub-agente: Criminalidad.
Fuentes: SpotCrime (scraping) + FBI UCR API (key opcional).
Retorna datos fail-soft — si falla, devuelve dict vacío con error.
"""
from __future__ import annotations
import os
import time
import requests
from bs4 import BeautifulSoup
from data_fetchers.base import USER_AGENT, DEFAULT_TIMEOUT
FBI_API_KEY = os.getenv("FBI_UCR_API_KEY", "")
FBI_BASE = "https://api.usa.gov/crime/fbi/cde"
def run(lat: float, lon: float, address: str) -> dict:
"""Recopila datos de criminalidad para la ubicación."""
result = {
"score_input": {},
"crimes_recent": [],
"crime_types": {},
"trend": "desconocido",
"sources": [],
"errors": [],
}
# --- SpotCrime scraping ---
try:
spot = _spotcrime(lat, lon)
result["crimes_recent"] = spot.get("crimes", [])
result["crime_types"] = spot.get("by_type", {})
result["sources"].append("SpotCrime.com")
except Exception as e:
result["errors"].append(f"SpotCrime: {e}")
# --- FBI UCR API (solo si hay key) ---
if FBI_API_KEY:
try:
fbi = _fbi_ucr(address)
result["fbi_data"] = fbi
result["sources"].append("FBI UCR API")
except Exception as e:
result["errors"].append(f"FBI UCR: {e}")
# Score input: cantidad de crímenes en los últimos 30 días
total = len(result["crimes_recent"])
result["score_input"]["total_crimes_30d"] = total
result["score_input"]["has_violent"] = any(
c.get("type", "").lower() in ("assault", "robbery", "shooting", "homicide")
for c in result["crimes_recent"]
)
return result
def _spotcrime(lat: float, lon: float) -> dict:
"""Scraping básico de SpotCrime para el área."""
url = f"https://spotcrime.com/crimes.json?lat={lat}&lon={lon}&callback=spotcrime"
headers = {"User-Agent": USER_AGENT, "Referer": "https://spotcrime.com"}
time.sleep(2)
r = requests.get(url, headers=headers, timeout=DEFAULT_TIMEOUT)
r.raise_for_status()
# SpotCrime devuelve JSONP — extraer JSON interior
text = r.text
if text.startswith("spotcrime("):
text = text[len("spotcrime("):-1]
import json
data = json.loads(text)
crimes = data.get("crimes", [])
by_type: dict = {}
for c in crimes:
t = c.get("type", "Other")
by_type[t] = by_type.get(t, 0) + 1
return {"crimes": crimes[:50], "by_type": by_type}
def _fbi_ucr(address: str) -> dict:
"""FBI UCR API — estadísticas por estado/ciudad."""
# Extraer estado de la dirección (últimas 2 letras antes del ZIP)
import re
m = re.search(r",\s*([A-Z]{2})\s+\d{5}", address.upper())
state = m.group(1) if m else "FL"
url = f"{FBI_BASE}/summarized/state/{state}/all?API_KEY={FBI_API_KEY}&from=2020&to=2023"
r = requests.get(url, timeout=DEFAULT_TIMEOUT, headers={"User-Agent": USER_AGENT})
r.raise_for_status()
return r.json()
def score(data: dict) -> int:
"""Calcula score 0-100 de seguridad (100 = muy seguro)."""
if not data or not data.get("score_input"):
return 50 # neutral si no hay datos
total = data["score_input"].get("total_crimes_30d", 0)
has_violent = data["score_input"].get("has_violent", False)
# Base score inversamente proporcional a crímenes
if total == 0:
base = 90
elif total <= 5:
base = 75
elif total <= 15:
base = 60
elif total <= 30:
base = 45
elif total <= 50:
base = 30
else:
base = 15
# Penalización por crimen violento
if has_violent:
base = max(0, base - 15)
return min(100, max(0, base))
@@ -0,0 +1,205 @@
"""Sub-agente: Demografía.
Fuente: Census ACS API (key gratuita en api.census.gov/data/key_signup.html).
Sin key, usa datos estimados por ZIP desde datos públicos del Census.
"""
from __future__ import annotations
import os
import re
import time
import requests
from data_fetchers.base import USER_AGENT, DEFAULT_TIMEOUT
CENSUS_KEY = os.getenv("CENSUS_API_KEY", "")
ACS_BASE = "https://api.census.gov/data/2022/acs/acs5"
# Variables ACS5 a consultar
ACS_VARS = {
"B19013_001E": "median_household_income",
"B01002_001E": "median_age",
"B23025_005E": "unemployed",
"B23025_002E": "labor_force",
"B15003_022E": "bachelors_degree",
"B15003_001E": "population_25plus",
"B03002_003E": "white_non_hispanic",
"B03002_004E": "black",
"B03002_012E": "hispanic",
"B03002_006E": "asian",
"B01003_001E": "total_population",
}
def run(lat: float, lon: float, address: str, tract_geoid: str = "",
state_fips: str = "", county_fips: str = "") -> dict:
result = {
"median_household_income": None,
"median_age": None,
"unemployment_rate": None,
"education_bachelors_pct": None,
"ethnicity": {},
"total_population": None,
"sources": [],
"errors": [],
}
# Extraer ZIP para fallback
zip_m = re.search(r"\b(\d{5})\b", address)
zip_code = zip_m.group(1) if zip_m else ""
# --- Census ACS API ---
if CENSUS_KEY and state_fips and county_fips:
try:
acs = _census_acs(state_fips, county_fips, tract_geoid)
result.update(acs)
result["sources"].append("Census ACS 5-Year")
except Exception as e:
result["errors"].append(f"Census ACS: {e}")
else:
result["errors"].append(
"Census API key no configurada. Agregar CENSUS_API_KEY en .env. "
"Obtener en: https://api.census.gov/data/key_signup.html"
)
# --- Fallback: Census ZIP (sin key) ---
if not result["sources"] and zip_code:
try:
z = _census_zip_no_key(zip_code)
result.update(z)
result["sources"].append("Census ZIP (estimado)")
except Exception as e:
result["errors"].append(f"Census ZIP fallback: {e}")
return result
def _census_acs(state_fips: str, county_fips: str, tract_geoid: str) -> dict:
"""Consulta Census ACS 5-Year para un census tract."""
vars_str = ",".join(ACS_VARS.keys())
# Extraer county y tract de GEOID (12 dígitos: SS+CCC+TTTTTT)
county = county_fips[-3:] if len(county_fips) >= 3 else county_fips
state = state_fips[:2]
tract = tract_geoid[-6:] if len(tract_geoid) >= 6 else "*"
params = {
"get": vars_str,
"for": f"tract:{tract}",
"in": f"state:{state} county:{county}",
"key": CENSUS_KEY,
}
headers = {"User-Agent": USER_AGENT}
time.sleep(0.5)
r = requests.get(ACS_BASE, params=params, headers=headers, timeout=DEFAULT_TIMEOUT)
r.raise_for_status()
rows = r.json()
if len(rows) < 2:
return {}
header = rows[0]
vals = rows[1]
data = {ACS_VARS.get(h, h): _safe_int(v) for h, v in zip(header, vals) if h in ACS_VARS}
return _process_acs(data)
def _census_zip_no_key(zip_code: str) -> dict:
"""Census sin key — datos por ZIP usando endpoint público."""
vars_str = "B19013_001E,B01002_001E,B01003_001E"
params = {"get": vars_str, "for": f"zip code tabulation area:{zip_code}"}
r = requests.get(ACS_BASE, params=params,
headers={"User-Agent": USER_AGENT}, timeout=DEFAULT_TIMEOUT)
r.raise_for_status()
rows = r.json()
if len(rows) < 2:
return {}
header = rows[0]
vals = rows[1]
raw = dict(zip(header, vals))
return {
"median_household_income": _safe_int(raw.get("B19013_001E")),
"median_age": _safe_int(raw.get("B01002_001E")),
"total_population": _safe_int(raw.get("B01003_001E")),
}
def _process_acs(data: dict) -> dict:
total_pop = data.get("total_population") or 1
labor = data.get("labor_force") or 1
pop25 = data.get("population_25plus") or 1
unemployed = data.get("unemployed") or 0
bachelors = data.get("bachelors_degree") or 0
white = data.get("white_non_hispanic") or 0
black = data.get("black") or 0
hispanic = data.get("hispanic") or 0
asian = data.get("asian") or 0
ethnicity = {
"white_non_hispanic_pct": round(white / total_pop * 100, 1),
"black_pct": round(black / total_pop * 100, 1),
"hispanic_pct": round(hispanic / total_pop * 100, 1),
"asian_pct": round(asian / total_pop * 100, 1),
"other_pct": max(0, round((total_pop - white - black - hispanic - asian) / total_pop * 100, 1)),
}
return {
"median_household_income": data.get("median_household_income"),
"median_age": data.get("median_age"),
"unemployment_rate": round(unemployed / labor * 100, 1) if labor > 0 else None,
"education_bachelors_pct": round(bachelors / pop25 * 100, 1) if pop25 > 0 else None,
"ethnicity": ethnicity,
"total_population": total_pop,
}
def _safe_int(v) -> int | None:
try:
return int(v)
except (TypeError, ValueError):
return None
def score(data: dict) -> int:
"""Score 0-100 basado en indicadores socioeconómicos."""
s = 50
income = data.get("median_household_income")
if income is not None:
if income >= 100000:
s += 20
elif income >= 75000:
s += 12
elif income >= 50000:
s += 5
elif income >= 35000:
s -= 5
else:
s -= 15
unemp = data.get("unemployment_rate")
if unemp is not None:
if unemp <= 3:
s += 15
elif unemp <= 5:
s += 8
elif unemp <= 8:
s += 0
elif unemp <= 12:
s -= 8
else:
s -= 15
edu = data.get("education_bachelors_pct")
if edu is not None:
if edu >= 50:
s += 10
elif edu >= 35:
s += 5
elif edu >= 20:
s += 0
else:
s -= 5
return min(100, max(0, s))
@@ -0,0 +1,160 @@
"""Sub-agente: Estilo de vida náutico.
Fuentes: Overpass API (marinas, boat ramps, playas, acceso al agua).
"""
from __future__ import annotations
import math
import time
import requests
from data_fetchers.base import USER_AGENT
OVERPASS_URL = "https://overpass-api.de/api/interpreter"
def run(lat: float, lon: float, address: str) -> dict:
result = {
"marinas": [],
"boat_ramps": [],
"beaches": [],
"nearest_marina": None,
"nearest_beach": None,
"nearest_boat_ramp": None,
"ocean_access": False,
"waterway_nearby": False,
"sources": ["OpenStreetMap/Overpass"],
"errors": [],
}
try:
data = _overpass_nautical(lat, lon)
result.update(data)
except Exception as e:
result["errors"].append(f"Overpass lifestyle: {e}")
return result
def _overpass_nautical(lat: float, lon: float, radius_m: int = 16000) -> dict:
"""Consulta amenidades náuticas en radio de ~10 millas."""
query = f"""
[out:json][timeout:35];
(
node["leisure"="marina"](around:{radius_m},{lat},{lon});
way["leisure"="marina"](around:{radius_m},{lat},{lon});
node["leisure"="slipway"](around:{radius_m},{lat},{lon});
way["leisure"="slipway"](around:{radius_m},{lat},{lon});
node["natural"="beach"](around:{radius_m},{lat},{lon});
way["natural"="beach"](around:{radius_m},{lat},{lon});
node["waterway"="river"](around:3200,{lat},{lon});
node["natural"="water"](around:3200,{lat},{lon});
way["natural"="coastline"](around:8000,{lat},{lon});
);
out body center;
"""
time.sleep(1)
r = requests.post(OVERPASS_URL, data={"data": query},
headers={"User-Agent": USER_AGENT}, timeout=40)
r.raise_for_status()
elements = r.json().get("elements", [])
marinas, boat_ramps, beaches = [], [], []
waterway_nearby = False
ocean_access = False
for el in elements:
tags = el.get("tags", {})
name = tags.get("name", "Sin nombre")
# Obtener coords
if "center" in el:
el_lat = el["center"]["lat"]
el_lon = el["center"]["lon"]
else:
el_lat = el.get("lat", lat)
el_lon = el.get("lon", lon)
dist = _haversine(lat, lon, el_lat, el_lon)
leisure = tags.get("leisure", "")
natural = tags.get("natural", "")
waterway = tags.get("waterway", "")
if leisure == "marina":
entry = {
"name": name,
"dist_miles": round(dist, 2),
"fuel": tags.get("fuel", "unknown"),
"pump_out": tags.get("pump_out", "unknown"),
"depth": tags.get("maxdraught", tags.get("depth", "unknown")),
}
marinas.append(entry)
elif leisure == "slipway":
boat_ramps.append({"name": name, "dist_miles": round(dist, 2)})
elif natural == "beach":
beaches.append({"name": name, "dist_miles": round(dist, 2)})
elif natural == "coastline":
ocean_access = True
elif waterway in ("river", "canal") or natural in ("water", "bay"):
waterway_nearby = True
marinas.sort(key=lambda x: x["dist_miles"])
boat_ramps.sort(key=lambda x: x["dist_miles"])
beaches.sort(key=lambda x: x["dist_miles"])
return {
"marinas": marinas[:10],
"boat_ramps": boat_ramps[:10],
"beaches": beaches[:10],
"nearest_marina": marinas[0] if marinas else None,
"nearest_beach": beaches[0] if beaches else None,
"nearest_boat_ramp": boat_ramps[0] if boat_ramps else None,
"ocean_access": ocean_access,
"waterway_nearby": waterway_nearby,
}
def _haversine(lat1: float, lon1: float, lat2: float, lon2: float) -> float:
R = 3958.8
dlat = math.radians(lat2 - lat1)
dlon = math.radians(lon2 - lon1)
a = math.sin(dlat/2)**2 + math.cos(math.radians(lat1)) * math.cos(math.radians(lat2)) * math.sin(dlon/2)**2
return R * 2 * math.asin(math.sqrt(a))
def score(data: dict) -> int:
"""Score 0-100 para lifestyle náutico."""
s = 30 # base
nearest_marina = data.get("nearest_marina")
if nearest_marina:
d = nearest_marina["dist_miles"]
if d <= 1:
s += 30
elif d <= 3:
s += 20
elif d <= 5:
s += 12
elif d <= 10:
s += 6
nearest_beach = data.get("nearest_beach")
if nearest_beach:
d = nearest_beach["dist_miles"]
if d <= 1:
s += 20
elif d <= 3:
s += 12
elif d <= 5:
s += 6
if data.get("ocean_access"):
s += 10
if data.get("waterway_nearby"):
s += 5
boat_ramps = len(data.get("boat_ramps", []))
s += min(10, boat_ramps * 2)
return min(100, max(0, s))
+151
View File
@@ -0,0 +1,151 @@
"""Sub-agente: Mercado laboral marítimo.
Fuentes: BLS.gov API (gratuita) + Overpass para instalaciones físicas.
"""
from __future__ import annotations
import time
import requests
from data_fetchers.base import USER_AGENT, DEFAULT_TIMEOUT
OVERPASS_URL = "https://overpass-api.de/api/interpreter"
BLS_BASE = "https://api.bls.gov/publicAPI/v2/timeseries/data/"
# NAICS codes marítimos para BLS
MARITIME_NAICS = {
"483": "Water Transportation",
"4883": "Support Activities for Water Transportation",
"3366": "Ship & Boat Building",
"114": "Fishing, Hunting and Trapping",
}
def run(lat: float, lon: float, address: str, state: str = "FL") -> dict:
result = {
"maritime_employers": [],
"shipyards": [],
"marinas_with_jobs": [],
"bls_employment": {},
"maritime_presence_score": 0,
"sources": [],
"errors": [],
}
# --- Overpass: instalaciones marítimas físicas ---
try:
facilities = _overpass_maritime(lat, lon)
result["shipyards"] = facilities.get("shipyards", [])
result["marinas_with_jobs"] = facilities.get("marinas", [])
result["maritime_employers"] = facilities.get("employers", [])
result["sources"].append("OpenStreetMap/Overpass")
except Exception as e:
result["errors"].append(f"Overpass maritime: {e}")
# --- BLS API (sin key — API v1 gratuita, limitada) ---
try:
bls = _bls_maritime(state)
result["bls_employment"] = bls
result["sources"].append("BLS.gov")
except Exception as e:
result["errors"].append(f"BLS: {e}")
# Presencia marítima general
result["maritime_presence_score"] = (
len(result["shipyards"]) * 15 +
len(result["marinas_with_jobs"]) * 8 +
len(result["maritime_employers"]) * 5
)
return result
def _overpass_maritime(lat: float, lon: float, radius_m: int = 16000) -> dict:
"""Instalaciones marítimas en radio de ~10 millas."""
query = f"""
[out:json][timeout:30];
(
node["industrial"="port"](around:{radius_m},{lat},{lon});
node["waterway"="boatyard"](around:{radius_m},{lat},{lon});
node["leisure"="marina"](around:{radius_m},{lat},{lon});
way["leisure"="marina"](around:{radius_m},{lat},{lon});
node["man_made"="shipyard"](around:{radius_m},{lat},{lon});
node["seamark:type"="harbour"](around:{radius_m},{lat},{lon});
);
out body center;
"""
time.sleep(1)
r = requests.post(OVERPASS_URL, data={"data": query},
headers={"User-Agent": USER_AGENT}, timeout=35)
r.raise_for_status()
elements = r.json().get("elements", [])
shipyards, marinas, employers = [], [], []
for el in elements:
tags = el.get("tags", {})
name = tags.get("name", "Sin nombre")
industrial = tags.get("industrial", "")
waterway = tags.get("waterway", "")
leisure = tags.get("leisure", "")
man_made = tags.get("man_made", "")
if man_made == "shipyard" or waterway == "boatyard":
shipyards.append({"name": name, "type": "shipyard"})
elif leisure == "marina":
marinas.append({"name": name, "type": "marina"})
elif industrial == "port":
employers.append({"name": name, "type": "port"})
return {"shipyards": shipyards[:10], "marinas": marinas[:10], "employers": employers[:10]}
def _bls_maritime(state: str) -> dict:
"""BLS API v1 — empleo en water transportation por estado."""
# Series ID formato: SMU{state_fips}0000004830000001 (Water Transportation)
# Sin key usamos endpoint público v1
series_id = f"SMU120000004830000001" # Florida como default
payload = {
"seriesid": [series_id],
"startyear": "2022",
"endyear": "2024",
}
headers = {"User-Agent": USER_AGENT, "Content-Type": "application/json"}
import json
r = requests.post(BLS_BASE, data=json.dumps(payload),
headers=headers, timeout=DEFAULT_TIMEOUT)
r.raise_for_status()
data = r.json()
series = data.get("Results", {}).get("series", [])
if not series:
return {}
latest = series[0].get("data", [])
if not latest:
return {}
return {
"series_id": series_id,
"latest_employment": latest[0].get("value"),
"period": latest[0].get("period"),
"year": latest[0].get("year"),
"label": "Water Transportation Employment (thousands)",
}
def score(data: dict) -> int:
"""Score 0-100 para mercado laboral marítimo."""
presence = data.get("maritime_presence_score", 0)
if presence >= 60:
return 90
elif presence >= 40:
return 75
elif presence >= 20:
return 60
elif presence >= 10:
return 45
elif presence > 0:
return 35
else:
return 20
+279
View File
@@ -0,0 +1,279 @@
"""Sub-agente: Valoración y mercado inmobiliario.
Fuentes: Zillow (scraping) + County Property Appraiser oficial de Florida.
Soporta todos los condados principales de Florida — se selecciona
automáticamente según el condado geocodificado.
"""
from __future__ import annotations
import re
import sys
import time
from pathlib import Path
import requests
from bs4 import BeautifulSoup
from data_fetchers.base import USER_AGENT, DEFAULT_TIMEOUT
_PROJECT_ROOT = Path(__file__).resolve().parent.parent.parent
if str(_PROJECT_ROOT) not in sys.path:
sys.path.insert(0, str(_PROJECT_ROOT))
# ── Mapa de condados → fetcher / sitio PA oficial ────────────────────────────
# Clave: fragmento del nombre del condado en minúsculas (como devuelve el geocoder)
# Valor: dict con 'fetcher' (función importable) o 'url' (sitio web PA para display)
COUNTY_PA_MAP = {
# Condados con fetcher dedicado en data_fetchers/
"broward": {"fetcher": "data_fetchers.pa_broward:fetch_pa_broward",
"name": "Broward County PA", "site": "https://bcpa.net"},
"miami-dade": {"fetcher": "data_fetchers.pa_miami_dade:fetch_pa_miami_dade",
"name": "Miami-Dade PA", "site": "https://www.miamidade.gov/Apps/PA/propertysearch"},
"palm beach": {"fetcher": "data_fetchers.pa_palm_beach:fetch_pa_palm_beach",
"name": "Palm Beach County PA", "site": "https://pbcpao.gov"},
"duval": {"fetcher": "data_fetchers.pa_duval:fetch_pa_duval",
"name": "Duval County PA (Jacksonville)", "site": "https://www.coj.net/departments/property-appraiser"},
# Condados con sitio PA oficial (scraping genérico o referencia)
"st. johns": {"site": "https://www.sjcpa.us",
"name": "St. Johns County PA (St. Augustine)"},
"saint johns":{"site": "https://www.sjcpa.us",
"name": "St. Johns County PA (St. Augustine)"},
"volusia": {"site": "https://vcpa.volusia.org",
"name": "Volusia County PA (Daytona Beach)"},
"orange": {"site": "https://www.ocpafl.org",
"name": "Orange County PA (Orlando)"},
"hillsborough":{"site": "https://www.hcpafl.org",
"name": "Hillsborough County PA (Tampa)"},
"pinellas": {"site": "https://www.pcpao.gov",
"name": "Pinellas County PA (St. Petersburg/Clearwater)"},
"seminole": {"site": "https://www.scpafl.org",
"name": "Seminole County PA (Sanford/Altamonte)"},
"osceola": {"site": "https://www.property-appraiser.org",
"name": "Osceola County PA (Kissimmee)"},
"brevard": {"site": "https://www.bcpao.us",
"name": "Brevard County PA (Melbourne/Cocoa)"},
"indian river":{"site": "https://www.ircpa.org",
"name": "Indian River County PA (Vero Beach)"},
"martin": {"site": "https://www.pa.martin.fl.us",
"name": "Martin County PA (Stuart/Hobe Sound)"},
"st. lucie": {"site": "https://www.paslc.gov",
"name": "St. Lucie County PA (Port St. Lucie/Fort Pierce)"},
"saint lucie":{"site": "https://www.paslc.gov",
"name": "St. Lucie County PA"},
"lee": {"site": "https://www.leepa.org",
"name": "Lee County PA (Fort Myers/Cape Coral)"},
"collier": {"site": "https://www.collierappraiser.com",
"name": "Collier County PA (Naples/Marco Island)"},
"charlotte": {"site": "https://www.ccappraiser.com",
"name": "Charlotte County PA (Port Charlotte/Punta Gorda)"},
"sarasota": {"site": "https://www.sc-pa.com",
"name": "Sarasota County PA"},
"manatee": {"site": "https://www.manateepao.gov",
"name": "Manatee County PA (Bradenton)"},
"polk": {"site": "https://www.polkpa.org",
"name": "Polk County PA (Lakeland/Winter Haven)"},
"pasco": {"site": "https://www.pascopa.com",
"name": "Pasco County PA (New Port Richey/Wesley Chapel)"},
"hernando": {"site": "https://www.hernandopa-fl.us",
"name": "Hernando County PA (Spring Hill/Brooksville)"},
"citrus": {"site": "https://www.citruspa.org",
"name": "Citrus County PA (Crystal River/Inverness)"},
"marion": {"site": "https://www.pa.marion.fl.us",
"name": "Marion County PA (Ocala)"},
"alachua": {"site": "https://www.acpafl.org",
"name": "Alachua County PA (Gainesville)"},
"putnam": {"site": "https://www.putnam-fl.com/pa",
"name": "Putnam County PA (Palatka)"},
"flagler": {"site": "https://www.flaglerpa.com",
"name": "Flagler County PA (Palm Coast/Flagler Beach)"},
"clay": {"site": "https://www.ccpao.com",
"name": "Clay County PA (Fleming Island/Orange Park)"},
"nassau": {"site": "https://www.nassauflpa.com",
"name": "Nassau County PA (Fernandina Beach/Yulee)"},
"baker": {"site": "https://www.bakerpa.com",
"name": "Baker County PA (Macclenny)"},
"columbia": {"site": "https://www.columbiapafl.com",
"name": "Columbia County PA (Lake City)"},
"leon": {"site": "https://www.leonpa.org",
"name": "Leon County PA (Tallahassee)"},
"escambia": {"site": "https://www.escpa.org",
"name": "Escambia County PA (Pensacola)"},
"santa rosa": {"site": "https://www.srcpa.org",
"name": "Santa Rosa County PA (Milton/Gulf Breeze)"},
"okaloosa": {"site": "https://www.okaloosapa.com",
"name": "Okaloosa County PA (Fort Walton Beach/Destin)"},
"walton": {"site": "https://www.waltonpa.com",
"name": "Walton County PA (Destin/30A/DeFuniak Springs)"},
"bay": {"site": "https://www.baycopa.com",
"name": "Bay County PA (Panama City)"},
"monroe": {"site": "https://www.mcpafl.org",
"name": "Monroe County PA (Florida Keys)"},
"lake": {"site": "https://www.lakepa.org",
"name": "Lake County PA (Leesburg/Tavares/Mount Dora)"},
"sumter": {"site": "https://www.sumterpa.com",
"name": "Sumter County PA (The Villages/Bushnell)"},
}
def _match_county(county: str) -> dict | None:
"""Encuentra el PA info para un condado dado."""
c = county.lower().strip()
# Coincidencia exacta primero
if c in COUNTY_PA_MAP:
return COUNTY_PA_MAP[c]
# Coincidencia parcial
for key, val in COUNTY_PA_MAP.items():
if key in c or c in key:
return val
return None
def run(lat: float, lon: float, address: str, county: str = "") -> dict:
"""Recopila datos de valoración inmobiliaria."""
result = {
"estimated_value": None,
"price_per_sqft": None,
"appreciation_1y": None,
"appreciation_3y": None,
"days_on_market": None,
"median_list_price": None,
"inventory": None,
"county_assessed_value": None,
"county_market_value": None,
"pa_site": None,
"pa_name": None,
"sources": [],
"errors": [],
}
# --- Zillow ---
try:
z = _zillow_neighborhood(lat, lon, address)
result.update({k: v for k, v in z.items() if v is not None})
result["sources"].append("Zillow")
except Exception as e:
result["errors"].append(f"Zillow: {e}")
# --- County Property Appraiser ---
pa_info = _match_county(county)
if pa_info:
result["pa_name"] = pa_info.get("name", "")
result["pa_site"] = pa_info.get("site", "")
fetcher_ref = pa_info.get("fetcher")
if fetcher_ref:
try:
module_path, func_name = fetcher_ref.split(":")
import importlib
mod = importlib.import_module(module_path)
fetch_fn = getattr(mod, func_name)
pa = fetch_fn(address)
if pa:
result["county_assessed_value"] = pa.get("assessed_value")
result["county_market_value"] = pa.get("market_value")
result["sources"].append(pa_info["name"])
except Exception as e:
result["errors"].append(f"{pa_info.get('name','PA')}: {e}")
else:
# Sin fetcher dedicado — registrar el sitio como referencia
result["sources"].append(f"{pa_info['name']} (referencia)")
else:
result["errors"].append(
f"County Appraiser no mapeado para: '{county}'. "
"Consulta manualemente en floridapropertytax.org"
)
return result
def _zillow_neighborhood(lat: float, lon: float, address: str) -> dict:
"""Scraping básico de Zillow para datos del vecindario."""
# Buscar ZIP de la dirección
zip_m = re.search(r"\b(\d{5})\b", address)
zip_code = zip_m.group(1) if zip_m else ""
if not zip_code:
raise ValueError("No se encontró ZIP code en la dirección")
url = f"https://www.zillow.com/homes/{zip_code}_rb/"
headers = {
"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36",
"Accept-Language": "en-US,en;q=0.9",
"Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8",
}
time.sleep(3) # rate limiting
r = requests.get(url, headers=headers, timeout=DEFAULT_TIMEOUT)
r.raise_for_status()
soup = BeautifulSoup(r.text, "html.parser")
# Extraer datos estructurados si están disponibles (script tags con JSON)
result = {}
for script in soup.find_all("script", type="application/json"):
try:
import json
data = json.loads(script.string or "")
# Buscar datos de precio en la estructura JSON de Zillow
if isinstance(data, dict):
props = data.get("cat1", {}).get("searchResults", {}).get("listResults", [])
if props:
prices = [p.get("price", 0) for p in props if p.get("price")]
if prices:
result["median_list_price"] = sorted(prices)[len(prices) // 2]
sqfts = [p.get("price", 0) / p.get("area", 1)
for p in props if p.get("price") and p.get("area")]
if sqfts:
result["price_per_sqft"] = round(sum(sqfts) / len(sqfts))
doms = [p.get("daysOnZillow", 0) for p in props if p.get("daysOnZillow")]
if doms:
result["days_on_market"] = round(sum(doms) / len(doms))
result["inventory"] = len(props)
except Exception:
continue
return result
def score(data: dict) -> int:
"""Calcula score 0-100 de mercado inmobiliario."""
if not data:
return 50
s = 50 # base
# Apreciación 1 año (si disponible)
app1 = data.get("appreciation_1y")
if app1 is not None:
if app1 >= 10:
s += 20
elif app1 >= 5:
s += 12
elif app1 >= 0:
s += 5
else:
s -= 10
# Días en mercado (menos días = mercado más activo)
dom = data.get("days_on_market")
if dom is not None:
if dom <= 20:
s += 15
elif dom <= 40:
s += 8
elif dom <= 60:
s += 0
else:
s -= 10
# Precio por sqft como indicador de demanda
ppsf = data.get("price_per_sqft")
if ppsf is not None:
if ppsf >= 300:
s += 10
elif ppsf >= 200:
s += 5
return min(100, max(0, s))
+151
View File
@@ -0,0 +1,151 @@
"""Sub-agente: Escuelas cercanas.
Fuente: GreatSchools.org (scraping) + Overpass API como fallback.
"""
from __future__ import annotations
import time
import requests
from bs4 import BeautifulSoup
from data_fetchers.base import USER_AGENT, DEFAULT_TIMEOUT
OVERPASS_URL = "https://overpass-api.de/api/interpreter"
def run(lat: float, lon: float, address: str) -> dict:
result = {
"schools": [],
"avg_rating": None,
"best_elementary": None,
"best_middle": None,
"best_high": None,
"sources": [],
"errors": [],
}
# --- GreatSchools ---
try:
gs = _greatschools(lat, lon)
result["schools"] = gs
result["sources"].append("GreatSchools.org")
except Exception as e:
result["errors"].append(f"GreatSchools: {e}")
# --- Fallback: Overpass (cuenta escuelas sin rating) ---
if not result["schools"]:
try:
op = _overpass_schools(lat, lon)
result["schools"] = op
result["sources"].append("OpenStreetMap/Overpass")
except Exception as e:
result["errors"].append(f"Overpass schools: {e}")
# Calcular promedio y mejores escuelas
rated = [s for s in result["schools"] if s.get("rating")]
if rated:
result["avg_rating"] = round(sum(s["rating"] for s in rated) / len(rated), 1)
elementary = [s for s in rated if s.get("level") == "elementary"]
middle = [s for s in rated if s.get("level") == "middle"]
high = [s for s in rated if s.get("level") == "high"]
if elementary:
result["best_elementary"] = max(elementary, key=lambda x: x["rating"])
if middle:
result["best_middle"] = max(middle, key=lambda x: x["rating"])
if high:
result["best_high"] = max(high, key=lambda x: x["rating"])
return result
def _greatschools(lat: float, lon: float) -> list:
"""Scraping de GreatSchools para escuelas cercanas."""
url = f"https://www.greatschools.org/search/search.page?lat={lat}&lon={lon}&distance=3&gradeLevels=e,m,h"
headers = {
"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36",
"Accept": "text/html,application/xhtml+xml",
}
time.sleep(2)
r = requests.get(url, headers=headers, timeout=DEFAULT_TIMEOUT)
r.raise_for_status()
soup = BeautifulSoup(r.text, "html.parser")
schools = []
for card in soup.select(".school-card, [data-school-id]")[:15]:
name_el = card.select_one(".school-name, h2, h3")
rating_el = card.select_one(".gs-rating, [class*='rating']")
level_el = card.select_one(".school-type, .grade-range")
name = name_el.get_text(strip=True) if name_el else "Desconocida"
try:
rating = int(rating_el.get_text(strip=True).split("/")[0]) if rating_el else None
except (ValueError, AttributeError):
rating = None
level_text = level_el.get_text(strip=True).lower() if level_el else ""
if "elementary" in level_text or "k-5" in level_text or "k-6" in level_text:
level = "elementary"
elif "middle" in level_text or "6-8" in level_text:
level = "middle"
elif "high" in level_text or "9-12" in level_text:
level = "high"
else:
level = "other"
schools.append({"name": name, "rating": rating, "level": level, "source": "GreatSchools"})
return schools
def _overpass_schools(lat: float, lon: float, radius_m: int = 4800) -> list:
"""Fallback: escuelas desde OpenStreetMap."""
query = f"""
[out:json][timeout:25];
(
node["amenity"="school"](around:{radius_m},{lat},{lon});
way["amenity"="school"](around:{radius_m},{lat},{lon});
);
out body;
"""
time.sleep(1)
r = requests.post(OVERPASS_URL, data={"data": query},
headers={"User-Agent": USER_AGENT}, timeout=30)
r.raise_for_status()
elements = r.json().get("elements", [])
schools = []
for el in elements[:20]:
tags = el.get("tags", {})
name = tags.get("name", "Escuela sin nombre")
schools.append({"name": name, "rating": None, "level": "other", "source": "OSM"})
return schools
def score(data: dict) -> int:
"""Score 0-100 basado en rating promedio de escuelas."""
avg = data.get("avg_rating")
if avg is None:
count = len(data.get("schools", []))
# Si hay escuelas pero sin rating, score neutral-positivo
return 45 if count == 0 else 55
# GreatSchools rating 1-10 → score 0-100
if avg >= 9:
return 95
elif avg >= 8:
return 85
elif avg >= 7:
return 75
elif avg >= 6:
return 65
elif avg >= 5:
return 55
elif avg >= 4:
return 40
elif avg >= 3:
return 30
else:
return 20
+1
View File
@@ -0,0 +1 @@
"""Utilidades compartidas del módulo location_agent."""
+85
View File
@@ -0,0 +1,85 @@
"""Geocoder para location_agent.
Wrapper sobre el Census Geocoder existente en data_fetchers/census_geocode.py.
Si falla Census, intenta Nominatim (OpenStreetMap) como fallback gratuito.
"""
from __future__ import annotations
import sys
import time
from pathlib import Path
import requests
_PROJECT_ROOT = Path(__file__).resolve().parent.parent.parent
if str(_PROJECT_ROOT) not in sys.path:
sys.path.insert(0, str(_PROJECT_ROOT))
from data_fetchers.census_geocode import fetch_geocode
from data_fetchers.base import FetcherError, USER_AGENT, DEFAULT_TIMEOUT
NOMINATIM_URL = "https://nominatim.openstreetmap.org/search"
def geocode(address: str) -> dict:
"""Geocodifica una dirección USA. Census primero, Nominatim como fallback.
Returns dict con: address, lat, lon, city, state, zip, county,
county_fips, state_fips, tract_geoid, source
Raises ValueError si no se puede geocodificar.
"""
# 1. Census Geocoder (preferido — devuelve tract FIPS)
try:
result = fetch_geocode(address)
if result.get("lat") and result.get("lng"):
return {
"address": result.get("matched_address", address),
"lat": float(result["lat"]),
"lon": float(result["lng"]),
"city": result.get("city", ""),
"state": result.get("state", ""),
"zip": result.get("zip", ""),
"county": result.get("county_name", ""),
"county_fips": result.get("county_fips", ""),
"state_fips": result.get("state_fips", ""),
"tract_geoid": result.get("tract_geoid", ""),
"source": "census",
}
except (FetcherError, Exception):
pass
# 2. Nominatim fallback
try:
params = {
"q": address,
"format": "json",
"addressdetails": 1,
"limit": 1,
"countrycodes": "us",
}
headers = {"User-Agent": USER_AGENT}
time.sleep(1)
r = requests.get(NOMINATIM_URL, params=params, headers=headers, timeout=DEFAULT_TIMEOUT)
r.raise_for_status()
results = r.json()
if results:
m = results[0]
addr = m.get("address", {})
return {
"address": m.get("display_name", address),
"lat": float(m["lat"]),
"lon": float(m["lon"]),
"city": addr.get("city") or addr.get("town") or addr.get("village", ""),
"state": addr.get("state", ""),
"zip": addr.get("postcode", ""),
"county": addr.get("county", ""),
"county_fips": "",
"state_fips": "",
"tract_geoid": "",
"source": "nominatim",
}
except Exception:
pass
raise ValueError(f"No se pudo geocodificar: {address!r}")
+101
View File
@@ -0,0 +1,101 @@
"""Cliente Ollama para síntesis narrativa de location_agent.
Solo se usa para texto — los scores son determinísticos.
Env vars:
OLLAMA_MODEL: modelo (default: llama3.1:8b)
OLLAMA_HOST: URL del servidor (default: http://localhost:11434)
"""
from __future__ import annotations
import json
import os
def _model() -> str:
return os.getenv("OLLAMA_MODEL", "llama3.1:8b")
def is_available() -> bool:
try:
import requests
r = requests.get(f"{os.getenv('OLLAMA_HOST', 'http://localhost:11434')}/api/tags", timeout=3)
return r.status_code == 200
except Exception:
return False
def analyze_section(data: dict, section: str, address: str) -> str:
"""Narrativa de 2-3 párrafos para una sección del reporte."""
if not is_available():
return _auto_summary(data, section)
try:
import ollama
prompt = (
f"Analiza los siguientes datos de {section} para la ubicación: {address}\n\n"
"Sé objetivo y profesional. 2-3 párrafos. Solo hechos relevantes para inversión "
"inmobiliaria. Sin recomendaciones de compra. Responde en español.\n\n"
f"Datos:\n{json.dumps(data, indent=2, ensure_ascii=False)}"
)
resp = ollama.chat(
model=_model(),
messages=[{"role": "user", "content": prompt}],
options={"temperature": 0.3},
)
return resp["message"]["content"].strip()
except Exception as e:
return _auto_summary(data, section) + f"\n\n[Ollama no disponible: {e}]"
def executive_summary(all_scores: dict, address: str, overall: int) -> dict:
"""Genera resumen ejecutivo. Devuelve {summary, strengths, weaknesses}."""
if not is_available():
return _auto_executive(all_scores, overall)
try:
import ollama
scores_txt = "\n".join(f" - {k}: {v}/100" for k, v in all_scores.items())
prompt = (
f"Resumen ejecutivo de inteligencia de ubicación para inversión inmobiliaria.\n"
f"Dirección: {address}\nScore General: {overall}/100\n\nScores:\n{scores_txt}\n\n"
"Proporciona en JSON:\n"
'{"summary": "3-5 párrafos objetivos", '
'"strengths": ["fortaleza 1","fortaleza 2","fortaleza 3"], '
'"weaknesses": ["debilidad 1","debilidad 2","debilidad 3"]}\n'
"Sin recomendaciones de compra. En español."
)
resp = ollama.chat(
model=_model(),
messages=[{"role": "user", "content": prompt}],
options={"temperature": 0.3},
format="json",
)
parsed = json.loads(resp["message"]["content"])
return {
"summary": parsed.get("summary", ""),
"strengths": parsed.get("strengths", [])[:3],
"weaknesses": parsed.get("weaknesses", [])[:3],
}
except Exception as e:
r = _auto_executive(all_scores, overall)
r["summary"] += f"\n[Ollama no disponible: {e}]"
return r
def _auto_summary(data: dict, section: str) -> str:
if not data:
return f"Datos de {section} no disponibles."
lines = [f"Resumen automático — {section}:"]
for k, v in list(data.items())[:8]:
if isinstance(v, (str, int, float, bool)) and v not in ("", None):
lines.append(f"{k}: {v}")
return "\n".join(lines)
def _auto_executive(scores: dict, overall: int) -> dict:
ranked = sorted(scores.items(), key=lambda x: x[1], reverse=True)
return {
"summary": f"Score general: {overall}/100. Active Ollama para análisis narrativo detallado.",
"strengths": [f"{k}: {v}/100" for k, v in ranked[:3]],
"weaknesses": [f"{k}: {v}/100" for k, v in ranked[-3:]],
}