/**
 * Azure Function that crawls a website starting from a single URL and
 * reports every page that was visited.
 *
 * @param context - Invocation context supplied by the Functions runtime; not
 *   used by this function.
 * @param crawlerParameters - `startUrl` is the first page to visit and
 *   `maxLenker` is passed to the crawler as `maxRequestsPerCrawl`.
 * @returns One `{ title, url }` entry per visited URL, in first-visit order.
 */
const activityFunction: AzureFunction = async function (
  context: Context,
  crawlerParameters: CrawlingParameters
) {
  // Point Crawlee's on-disk storage at the OS temp directory.
  // NOTE(review): presumably because the default location is not writable in
  // the hosting environment — confirm.
  process.env.CRAWLEE_STORAGE_DIR = os.tmpdir();

  // Links ending in these extensions are not enqueued. The dot is escaped so
  // that only a real ".pdf" / ".doc" suffix matches (an unescaped dot would
  // also reject URLs such as ".../about-pdf").
  const excludedLinkPatterns = [/\.pdf$/, /\.doc$/];

  // Keyed by URL: a Set of object literals compares by identity and would
  // never de-duplicate, so a request retried after a handler failure would
  // otherwise be reported twice.
  const pagesByUrl = new Map<string, { title: string; url: string }>();

  const crawler = new PuppeteerCrawler({
    async requestHandler({ request, page, enqueueLinks }) {
      const title = await page.title();
      pagesByUrl.set(request.url, { title, url: request.url });
      await enqueueLinks({ exclude: excludedLinkPatterns });
    },
    maxRequestsPerCrawl: crawlerParameters.maxLenker,
  });

  await crawler.run([crawlerParameters.startUrl]);
  return Array.from(pagesByUrl.values());
};