// Files
// robot-proveedores/robot.js
// 2026-02-13 09:31:36 +00:00
//
// 206 lines
// 9.2 KiB
// JavaScript

import { chromium } from 'playwright';
import pg from 'pg';
// PostgreSQL connection string; the robot cannot do anything without it.
const DATABASE_URL = process.env.DATABASE_URL;

if (!DATABASE_URL) {
  console.error("❌ Error: No hay DATABASE_URL definida.");
  process.exit(1);
}

// Shared connection pool used by every query in this file (TLS disabled).
const pool = new pg.Pool({
  connectionString: DATABASE_URL,
  ssl: false,
});

// Whether the Chromium instances launched by the scrapers run without a UI.
const HEADLESS = true;
/**
 * Main loop of the robot.
 *
 * On every cycle it loads all rows of `provider_credentials` whose status is
 * 'active', runs the scraper matching each row's `provider`, stamps
 * `last_sync`, and then sleeps for 15 minutes. The loop never ends on its own.
 *
 * Errors are contained at two levels so the loop keeps running:
 *  - a failure while handling one credential is logged and the next
 *    credential is still processed;
 *  - a failure of the cycle itself (e.g. the SELECT) is logged and retried
 *    after the sleep.
 *
 * @returns {Promise<never>} Does not resolve under normal operation.
 */
async function main() {
  const SLEEP_MS = 15 * 60 * 1000;

  console.log("🤖 ROBOT MODO: ASPIRADORA INDUSTRIAL (CAPTURA TODO)");
  while (true) {
    try {
      // pool.query checks a client out only for the duration of each
      // statement, so no connection is held while the browsers are scraping.
      const res = await pool.query("SELECT * FROM provider_credentials WHERE status = 'active'");
      const credentials = res.rows;
      console.log(`📋 Cuentas activas: ${credentials.length}`);

      for (const cred of credentials) {
        try {
          // Despite the column name, the stored value is base64 text that
          // decodes to the password typed into the provider's login form.
          const password = Buffer.from(cred.password_hash, 'base64').toString('utf-8');
          console.log(`\n🔄 Escaneando ${cred.provider.toUpperCase()} (ID: ${cred.owner_id})...`);

          if (cred.provider === 'multiasistencia') {
            await runMultiasistencia(cred.owner_id, cred.username, password);
          } else if (cred.provider === 'homeserve') {
            await runHomeserve(cred.owner_id, cred.username, password);
          }

          await pool.query("UPDATE provider_credentials SET last_sync = NOW() WHERE id = $1", [cred.id]);
        } catch (e) {
          // A malformed row or a DB hiccup for one account must not stop
          // the remaining accounts from being scanned.
          console.error(`❌ Error cuenta ${cred.id}:`, e.message);
        }
      }
    } catch (e) {
      console.error("❌ Error ciclo:", e.message);
    }

    console.log("\n💤 Durmiendo 15 minutos...");
    await new Promise((resolve) => setTimeout(resolve, SLEEP_MS));
  }
}
// ==========================================
// 🧹 MULTIASISTENCIA (EXTRACCIÓN TOTAL)
// ==========================================
/**
 * Scrapes every open "expediente" of a Multiasistencia account and stores
 * the raw key/value data of each one through saveServiceToDB.
 *
 * Flow: open the login page, log in if a user input is found, open the
 * listing page, collect the distinct `reparacion=<digits>` ids from its
 * links, then visit each detail page and harvest its table cells.
 *
 * Failures are logged, never thrown (except a failure to launch Chromium
 * itself). A failure on one expediente is logged and the next one is still
 * processed. The browser is always closed once it has been launched.
 *
 * @param {*} ownerId - Owner id stored with each scraped service.
 * @param {string} user - Login user name.
 * @param {string} pass - Login password (plain text).
 * @returns {Promise<void>}
 */
async function runMultiasistencia(ownerId, user, pass) {
  const browser = await chromium.launch({ headless: HEADLESS, args: ['--no-sandbox'] });
  try {
    // Created inside the try so the browser is closed even if this fails.
    const context = await browser.newContext();
    const page = await context.newPage();

    console.log("🌍 [Multi] Entrando...");
    await page.goto('https://web.multiasistencia.com/w3multi/acceso.php', { timeout: 60000 });

    // The login form is only filled when a user input can be located.
    const userInput = await page.$('input[name="usuario"]') || await page.$('input[type="text"]');
    if (userInput) {
      await userInput.fill(user);
      await page.fill('input[type="password"]', pass);
      await page.click('input[type="submit"]');
      await page.waitForTimeout(4000);
    }

    await page.goto('https://web.multiasistencia.com/w3multi/frepasos_new.php?refresh=1', { waitUntil: 'domcontentloaded' });

    // Distinct numeric ids taken from every link that carries "reparacion=".
    const expedientes = await page.evaluate(() => {
      const links = Array.from(document.querySelectorAll('a[href*="reparacion="]'));
      return Array.from(new Set(links.map(a => a.href.match(/reparacion=(\d+)/)?.[1]).filter(Boolean)));
    });
    console.log(`🔍 [Multi] ${expedientes.length} expedientes.`);

    for (const ref of expedientes) {
      try {
        await page.goto(`https://web.multiasistencia.com/w3multi/repasos1.php?reparacion=${ref}`, { waitUntil: 'domcontentloaded' });

        // Aggressive capture: runs in the page, so it must be self-contained.
        const fullData = await page.evaluate(() => {
          const data = {};
          // Walk every row of every table on the page.
          const rows = document.querySelectorAll('tr');
          rows.forEach(row => {
            const cells = Array.from(row.querySelectorAll('td, th'));
            // Try to pair adjacent cells: cell i (key) -> cell i+1 (value).
            for (let i = 0; i < cells.length - 1; i++) {
              let key = cells[i].innerText.trim().replace(':', '');
              let val = cells[i+1]?.innerText.trim();
              // Basic clean-up filters on key length and non-empty value.
              if (key.length > 2 && key.length < 60 && val && val.length > 0) {
                // First occurrence of a key wins; later ones are not stored.
                if (!data[key]) {
                  data[key] = val;
                  // Skip the value cell so it is not read as a key next.
                  i++;
                }
              }
            }
          });
          // Guarantee the minimum fields (fallbacks).
          if (!data.clientName) data.clientName = data["Nombre Cliente"] || data["Asegurado"] || "Desconocido";
          if (!data.address) data.address = data["Dirección"] || data["Domicilio"] || data["Riesgo"] || "";
          // First 9-digit run starting with 6-9 found anywhere in the page text.
          if (!data.phone) data.phone = (document.body.innerText.match(/[6789]\d{8}/) || [])[0] || "";
          return data;
        });

        // The three fallback fields alone are not worth saving.
        if (fullData && Object.keys(fullData).length > 2) {
          await saveServiceToDB(ownerId, 'multiasistencia', ref, fullData);
        }
      } catch (errRef) {
        // One broken expediente must not abort the remaining ones.
        console.error(`⚠️ [Multi] Error ref ${ref}:`, errRef.message);
      }
    }
  } catch (e) {
    console.error("❌ [Multi]", e.message);
  } finally {
    await browser.close();
  }
}
// ==========================================
// 🧹 HOMESERVE (EXTRACCIÓN TOTAL)
// ==========================================
/**
 * Scrapes every service listed for a HomeServe account and stores the raw
 * key/value data of each one through saveServiceToDB.
 *
 * Flow: open the login page, log in if the CODIGO input is visible, open the
 * full service list, collect the first 6-10 digit number of each table row
 * as a reference, then for each reference reload the list, click the text
 * matching it and harvest the table cells of the resulting page.
 *
 * Failures are logged, never thrown (except a failure to launch Chromium
 * itself). A failure on one reference is logged with its message and the
 * next reference is still processed. The browser is always closed once it
 * has been launched.
 *
 * @param {*} ownerId - Owner id stored with each scraped service.
 * @param {string} user - Login code typed into the CODIGO field.
 * @param {string} pass - Login password (plain text).
 * @returns {Promise<void>}
 */
async function runHomeserve(ownerId, user, pass) {
  const LIST_URL = 'https://www.clientes.homeserve.es/cgi-bin/fccgi.exe?w3exec=lista_servicios_total';

  const browser = await chromium.launch({ headless: HEADLESS, args: ['--no-sandbox'] });
  try {
    // Created inside the try so the browser is closed even if this fails.
    const page = await browser.newPage();

    console.log("🌍 [HomeServe] Entrando...");
    await page.goto('https://www.clientes.homeserve.es/cgi-bin/fccgi.exe?w3exec=PROF_PASS', { timeout: 60000 });
    if (await page.isVisible('input[name="CODIGO"]')) {
      await page.fill('input[name="CODIGO"]', user);
      await page.fill('input[type="password"]', pass);
      await page.keyboard.press('Enter');
      await page.waitForTimeout(5000);
    }

    await page.goto(LIST_URL);

    // One reference per table row: the first run of 6 to 10 digits in its text.
    const refs = await page.evaluate(() => {
      const filas = Array.from(document.querySelectorAll('table tr'));
      const found = [];
      filas.forEach(tr => {
        const txt = tr.innerText;
        const match = txt.match(/(\d{6,10})/);
        if (match) found.push(match[1]);
      });
      return [...new Set(found)];
    });
    console.log(`🔍 [HomeServe] ${refs.length} expedientes.`);

    for (const ref of refs) {
      try {
        // The detail page is reached by clicking from the list, so the list
        // is reloaded before every reference.
        await page.goto(LIST_URL);
        const link = page.getByText(ref).first();
        if (await link.isVisible()) {
          await link.click();
          await page.waitForTimeout(1500);

          // Runs in the page, so it must be self-contained.
          const fullData = await page.evaluate(() => {
            const d = {};
            const rows = Array.from(document.querySelectorAll('tr'));
            rows.forEach(r => {
              const cells = r.querySelectorAll('td');
              // Rows are read as Key | Value, and as Key | Value | Key | Value
              // when they have at least four cells.
              for (const start of [0, 2]) {
                if (cells.length >= start + 2) {
                  const k = cells[start].innerText.toUpperCase().trim().replace(':', '');
                  const v = cells[start + 1].innerText.trim();
                  if (k.length > 1 && v.length > 0) d[k] = v;
                }
              }
            });
            // Minimal mapping to the normalized fields.
            d.clientName = d["CLIENTE"] || d["ASEGURADO"] || "Desconocido";
            d.phone = d["TELEFONOS"] || d["MOVIL"] || "";
            const street = d["DOMICILIO"] || d["DIRECCION"] || "";
            // Join only the parts that exist so a missing street does not
            // leave a dangling ", " in front of the town.
            d.address = [street, d["POBLACION"]].filter(Boolean).join(", ");
            return d;
          });

          if (fullData) {
            await saveServiceToDB(ownerId, 'homeserve', ref, fullData);
          }
        }
      } catch (errRef) {
        // Keep going with the next reference, but report why this one failed.
        console.error(`⚠️ Error ref ${ref}:`, errRef.message);
      }
    }
  } catch (e) {
    console.error("❌ [HomeServe]", e.message);
  } finally {
    await browser.close();
  }
}
/**
 * Inserts one scraped service into `scraped_services` with status 'pending',
 * or, when a row with the same (owner_id, provider, service_ref) already
 * exists, overwrites its raw_data and sets created_at to NOW().
 *
 * @param {*} ownerId - Value stored in owner_id.
 * @param {string} provider - Value stored in provider.
 * @param {string} ref - Value stored in service_ref.
 * @param {object} data - Scraped fields; stored JSON-serialized in raw_data.
 * @returns {Promise<void>}
 */
async function saveServiceToDB(ownerId, provider, ref, data) {
  const fieldCount = Object.keys(data).length;
  console.log(`💾 Guardando ${ref} con ${fieldCount} variables encontradas.`);

  const upsertSql = `
INSERT INTO scraped_services (owner_id, provider, service_ref, raw_data, status)
VALUES ($1, $2, $3, $4, 'pending')
ON CONFLICT (owner_id, provider, service_ref)
DO UPDATE SET raw_data = EXCLUDED.raw_data, created_at = NOW()
`;
  const params = [ownerId, provider, ref, JSON.stringify(data)];

  await pool.query(upsertSql, params);
}
// Start the robot. The promise is not left floating: if main() ever rejects,
// the failure is logged and the process exits with a non-zero code.
main().catch((err) => {
  console.error("❌ Error fatal:", err);
  process.exit(1);
});