Files
RSSHub/lib/v2/scitation/journal.js
Derek d8c3126570 fix(route): scitation - use Puppeteer due to the obstacle by cloudflare challenge (#10190)
* fix(route): scitation - use Puppeteer due to the obstacle by cloudflare challenge

* feat: update utils.js and journal.js

* feat: prepare for section.js

* feat: add section.js

* fix(section.js): fix "section" length undifine error

* feat: format

* update(docs): add puppeteer="1"
2022-07-13 19:35:09 +08:00

55 lines
1.8 KiB
JavaScript

const cheerio = require('cheerio');
const { puppeteerGet, renderDesc } = require('./utils');
const config = require('@/config').value;
module.exports = async (ctx) => {
const pub = ctx.params.pub;
const jrn = ctx.params.jrn;
const host = `https://${pub}.scitation.org`;
const jrnlUrl = `${host}/toc/${jrn}/current?size=all`;
// use Puppeteer due to the obstacle by cloudflare challenge
const browser = await require('@/utils/puppeteer')();
const { jrnlName, list } = await ctx.cache.tryGet(
jrnlUrl,
async () => {
const response = await puppeteerGet(jrnlUrl, browser);
const $ = cheerio.load(response);
const jrnlName = $('.header-journal-title').text();
const list = $('.card')
.toArray()
.map((item) => {
$(item).find('.access-text').remove();
const title = $(item).find('.hlFld-Title').text();
const authors = $(item).find('.entryAuthor.all').text();
const img = $(item).find('img').attr('src');
const link = $(item).find('.ref.nowrap').attr('href');
const doi = link.replace('/doi/full/', '');
const description = renderDesc(title, authors, doi, img);
return {
title,
link,
doi,
description,
};
});
return {
jrnlName,
list,
};
},
config.cache.routeExpire,
false
);
browser.close();
ctx.state.data = {
title: jrnlName,
link: jrnlUrl,
item: list,
allowEmpty: true,
};
};