forked from philippta/flyscrape
-
Notifications
You must be signed in to change notification settings - Fork 0
/
template.js
27 lines (24 loc) · 1.2 KB
/
template.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
/**
 * Scraping options.
 *
 * Only `url` is active. Every other entry is commented out; uncomment one
 * to override the default stated in its description.
 */
export const config = {
  // Specify the URL to start scraping from.
  url: "https://news.ycombinator.com/",

  // Specify how deep links should be followed. (default = 0, no follow)
  // depth: 0,

  // Specify the allowed domains. ['*'] for all. (default = domain from url)
  // allowedDomains: [],

  // Specify the blocked domains. (default = none)
  // blockedDomains: [],

  // Specify the allowed URLs as regex. (default = all allowed)
  // allowedURLs: [],

  // Specify the blocked URLs as regex. (default = none blocked)
  // blockedURLs: [],

  // Specify the rate in requests per second. (default = 100)
  // rate: 100,

  // Enable file-based request caching. (default = no cache)
  // cache: "file",
};
/**
 * Extracts the page title and the list of posts from a scraped page.
 *
 * The function is named (rather than an anonymous default export) so it
 * shows up as `scrape` in stack traces; it is still the module's default
 * export.
 *
 * @param {object} context - Values supplied by the caller for the current page.
 * @param {object} context.doc - Queryable document; must provide
 *   `find(selector)` whose result supports `text()`, `attr(name)`, `find()`
 *   and `map(callback)`.
 * @param {function(string): string} context.absoluteURL - Called with each
 *   post link's `href`; presumably resolves it against the page URL —
 *   confirm against the scraper's documentation.
 * @returns {{title: string, posts: Array<{title: string, url: string}>}}
 *   The text of the `title` element, plus one `{ title, url }` entry per
 *   `.athing` element, read from that element's `.titleline > a` link.
 */
export default function scrape({ doc, absoluteURL }) {
  const title = doc.find("title");
  const posts = doc.find(".athing");

  return {
    title: title.text(),
    posts: posts.map((post) => {
      const link = post.find(".titleline > a");

      return {
        title: link.text(),
        url: absoluteURL(link.attr("href")),
      };
    }),
  };
}