Apify 是一个强大的工具,用于创建和管理网络抓取任务。它支持多种抓取器,包括基于 Web 的抓取器、Cheerio 和 Puppeteer。下面是如何使用这些抓取器从 Apify 中获取数据的详细解释。
const Apify = require('apify');
Apify.main(async () => {
const requestQueue = await Apify.openRequestQueue();
await requestQueue.addRequest({ url: 'https://example.com' });
const crawler = new Apify.Crawler({
requestQueue,
handlePageFunction: async ({ request, page }) => {
const content = await page.content();
console.log(content);
}
});
await crawler.run();
});
const Apify = require('apify');
const cheerio = require('cheerio');
Apify.main(async () => {
const requestQueue = await Apify.openRequestQueue();
await requestQueue.addRequest({ url: 'https://example.com' });
const crawler = new Apify.Crawler({
requestQueue,
handlePageFunction: async ({ request, page }) => {
const content = await page.content();
const $ = cheerio.load(content);
console.log($('title').text());
}
});
await crawler.run();
});
const Apify = require('apify');
Apify.main(async () => {
const requestQueue = await Apify.openRequestQueue();
await requestQueue.addRequest({ url: 'https://example.com' });
const crawler = new Apify.PuppeteerCrawler({
requestQueue,
handlePageFunction: async ({ page, request }) => {
await page.waitForSelector('title');
const title = await page.title();
console.log(title);
}
});
await crawler.run();
});
通过上述方法和示例代码,你可以根据具体需求选择合适的抓取器来从 Apify 中获取所需的数据。
领取专属 10元无门槛券
手把手带您无忧上云