1import { ApifyClient } from 'apify-client';
2
3
4
// API client used for every request below. Replace the placeholder with a
// real API token before running the script.
const client = new ApifyClient({ token: '<YOUR_API_TOKEN>' });
8
9
// Input object handed to the Actor call further down in this script.
const input = {
  startUrls: [{ url: 'https://docs.apify.com/academy/scraping-basics-javascript' }],
  useSitemaps: false,
  useLlmsTxt: false,
  respectRobotsTxtFile: true,
  crawlerType: 'playwright:adaptive',
  includeUrlGlobs: [],
  excludeUrlGlobs: [],
  initialCookies: [],
  customHttpHeaders: {},
  signHttpRequests: false,
  proxyConfiguration: { useApifyProxy: true },
  keepElementsCssSelector: '',
  // A single comma-separated selector list; every entry after the first
  // sits on its own line of the resulting string.
  removeElementsCssSelector: [
    "nav, footer, script, style, noscript, svg, img[src^='data:']",
    '[role="alert"]',
    '[role="banner"]',
    '[role="dialog"]',
    '[role="alertdialog"]',
    '[role="region"][aria-label*="skip" i]',
    '[aria-modal="true"]',
  ].join(',\n '),
  blockMedia: true,
  clickElementsCssSelector: '[aria-expanded="false"]',
  storeSkippedUrls: false,
};
40
41
// Call the Actor with the prepared input and wait for the promise to settle;
// the resolved value is used below for its `defaultDatasetId`.
const crawlerActor = client.actor('gip/website-content-crawler');
const run = await crawlerActor.call(input);
43
44
// Print a console link to the run's default dataset, then list the dataset
// items and dump each one.
console.log('Results from dataset');
const datasetId = run.defaultDatasetId;
console.log(`💾 Check your data here: https://console.apify.com/storage/datasets/${datasetId}`);
const { items } = await client.dataset(datasetId).listItems();
for (const item of items) {
  console.dir(item);
}
51
52