fix(kb.gbapp): HTML crawler improved.
This commit is contained in:
parent
5d0a58ee6d
commit
d694038532
1 changed files with 13 additions and 10 deletions
|
@ -1019,17 +1019,20 @@ export class KBService implements IGBKBService {
|
||||||
}
|
}
|
||||||
|
|
||||||
async getFreshPage(browser, url) {
|
async getFreshPage(browser, url) {
|
||||||
try {
|
if (!browser || browser.isConnected() === false) {
|
||||||
if (!browser || browser.isConnected() === false) {
|
browser = await puppeteer.launch({ headless: false });
|
||||||
browser = await puppeteer.launch({ headless: false }); // Change headless to true if you don't want to see the browser window
|
|
||||||
}
|
|
||||||
const page = await browser.newPage();
|
|
||||||
await page.goto(url);
|
|
||||||
return page;
|
|
||||||
} catch (error) {
|
|
||||||
console.error('An error occurred while getting fresh page:', error);
|
|
||||||
throw error;
|
|
||||||
}
|
}
|
||||||
|
const page = await browser.newPage();
|
||||||
|
try {
|
||||||
|
await page.goto(url, {
|
||||||
|
waitUntil: 'networkidle0', // Wait until network is idle
|
||||||
|
timeout: 30000 // 30 second timeout
|
||||||
|
});
|
||||||
|
} catch (err) {
|
||||||
|
// Ignore timeout/navigation errors
|
||||||
|
}
|
||||||
|
|
||||||
|
return page;
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
|
Loading…
Add table
Reference in a new issue