JDRssDownloader/LinkGrabber.js

45 lines
1.0 KiB
JavaScript
Raw Normal View History

2022-06-09 10:06:22 +01:00
const axios = require('axios');
var cheerio = require('cheerio');
2023-06-07 14:43:17 +01:00
async function flareSolverr(url) {
2023-06-06 16:42:28 +01:00
var data = JSON.stringify({
"cmd": "request.get",
"url": url,
"maxTimeout": 120000
});
var config = {
method: 'post',
url: 'http://127.0.01:8191/v1',
headers: {
'Content-Type': 'application/json'
},
data: data
};
res = await axios(config)
return res.data.solution.response
}
2022-06-09 10:06:22 +01:00
async function getLinksFromURL(url) {
try {
let links = [];
2023-06-07 14:43:17 +01:00
let scrape = await flareSolverr(url)
2023-06-06 16:42:28 +01:00
// let httpResponse = await axios.get(url);
2022-06-09 10:06:22 +01:00
2023-06-06 16:42:28 +01:00
let $ = cheerio.load(scrape);
2022-06-09 10:06:22 +01:00
let linkObjects = $('a'); // get all hyperlinks
linkObjects.each((index, element) => {
links.push(
$(element).attr('href'), // get the href attribute
);
});
return links;
} catch (e) { console.log(e) }
}
module.exports = {
getLinksFromURL
}