From 3145ca84832b6e2d7108c048e9cfcab64e532d9e Mon Sep 17 00:00:00 2001 From: "Rodrigo Rodriguez (Pragmatismo)" Date: Fri, 26 Sep 2025 14:47:13 -0300 Subject: [PATCH] Remove images and CSS from crawled pages --- packages/kb.gbapp/services/KBService.ts | 25 +++++++++++++++++-------- 1 file changed, 17 insertions(+), 8 deletions(-) diff --git a/packages/kb.gbapp/services/KBService.ts b/packages/kb.gbapp/services/KBService.ts index 53988aa65..46e9b34cd 100644 --- a/packages/kb.gbapp/services/KBService.ts +++ b/packages/kb.gbapp/services/KBService.ts @@ -1208,14 +1208,23 @@ export class KBService implements IGBKBService { await min.core['setConfig'](min, 'Color1', colors[0].hex()); await min.core['setConfig'](min, 'Color2', colors[1].hex()); } - // Disables images in crawling. - await page.route('**/*', route => { - const type = route.request().resourceType(); - if (type === 'image' || type === 'stylesheet') { - route.abort(); - } else { - route.continue(); - } + + // Remove images and disable CSS after page loads + await page.evaluate(() => { + // Remove all images + document.querySelectorAll('img').forEach(img => img.remove()); + + // Disable all stylesheets + document.querySelectorAll('link[rel="stylesheet"]').forEach(link => { + link['disabled'] = true; + link.remove(); + }); + + // Remove inline styles + document.querySelectorAll('style').forEach(style => style.remove()); + + // Remove style attributes + document.querySelectorAll('[style]').forEach(el => el.removeAttribute('style')); }); page.on('dialog', async dialog => {