Files
parcer/scraper/src/scraper.js
karishmas6 8ba8a6927c chore: lint
2024-04-20 00:51:38 +05:30

25 lines
791 B
JavaScript

import { PlaywrightCrawler, Configuration } from 'crawlee';
async function scrapeData(url, selectors) {
const scrapedData = [];
const crawler = new PlaywrightCrawler({
requestHandler: async ({ page, request }) => {
await page.goto(url);
console.log('Received selectors:', selectors);
for (const selector of selectors) {
const elementData = await page.$$eval(selector, elements => elements.map(el => el.textContent.trim()));
scrapedData.push(...elementData);
}
console.log('Scraped data:', scrapedData);
},
},
new Configuration({
persistStorage: false,
}));
await crawler.run([url]);
return scrapedData;
}
export default scrapeData;