Files
RSSHub/lib/v2/sdu/cmse.js
Levi Zim 958be6266e feat(route): 山东大学(威海)新闻网 (#9537)
* feat(sduwh): add extractors.

* feat(route): add route for 山东大学(威海)新闻网

* docs: for route sduwh/news

* docs: for route sduwh/news

(cherry picked from commit 831830167a)

* feat(radar): for route 山东大学(威海)新闻网

* refactor: change `got.get` to `got`.

* refactor: prefer `parseDate()` to `new Date()`

Co-authored-by: Tony <TonyRL@users.noreply.github.com>

* fix: incomplete URL substring sanitization.

Make CodeQL happy.

* fix(radar): fix target field.

* fix: change route /sduwh to /sdu/wh

* fix: remove superfluous slash character in url.

* feat: look for exact date first.

* feat: extract exact date from news extractor.

* feat: extract exact date from view extractor.

* feat: extractor for www.sdrj.sdu.edu.cn

* refactor: semantic separation of sduwh with sdu

* feat(radar): more accurate name

* docs: update documentation

* refactor: migrate to v2

* refactor: fix deprecated url.resolve

* fix: update docs url

Co-authored-by: Tony <TonyRL@users.noreply.github.com>

* fix: sdu not working routes

* fix: accurate `ctx.state.data.url`

Co-authored-by: Tony <TonyRL@users.noreply.github.com>

* fix: better error handling for extractors.

* fix: timezone

Co-authored-by: Tony <TonyRL@users.noreply.github.com>

* fix: better error handling.

Co-authored-by: Tony <TonyRL@users.noreply.github.com>
2022-04-17 00:01:39 +08:00

60 lines
2.1 KiB
JavaScript

const got = require('@/utils/got');
const cheerio = require('cheerio');
const { parseDate } = require('@/utils/parse-date');
const host = 'http://www.cmse.sdu.edu.cn/';
const typelist = ['通知公告', '学院新闻', '本科生教育', '研究生教育', '学术动态'];
const urlList = ['zxzx/tzgg.htm', 'zxzx/xyxw.htm', 'zxzx/bksjy.htm', 'zxzx/yjsjy.htm', 'zxzx/xsdt.htm'];
module.exports = async (ctx) => {
const type = ctx.params.type ? parseInt(ctx.params.type) : 0;
const link = new URL(urlList[type], host).href;
const response = await got(link);
const $ = cheerio.load(response.data);
let item = $('.article_list li')
.map((_, e) => {
e = $(e);
const a = e.find('a');
return {
title: a.text().trim(),
link: a.attr('href'),
pubDate: parseDate(e.find('.date').text(), 'YYYY/MM/DD'),
};
})
.get();
item = await Promise.all(
item
.filter((e) => e.link.startsWith('../info'))
.map((item) => {
item.link = new URL(item.link.slice('3'), host).href;
return ctx.cache.tryGet(item.link, async () => {
const response = await got(item.link);
const $ = cheerio.load(response.data);
item.title = $('.contentTitle').text();
item.author =
$('.contentTitle2')
.find('span')
.eq(1)
.text()
.trim()
.match(/作者:(.*)/)[1] || '山东大学材料科学与工程学院';
$('.contentTitle, .contentTitle2').remove();
item.description = $('.content_detail').html();
return item;
});
})
);
ctx.state.data = {
title: `山东大学材料科学与工程学院${typelist[type]}`,
description: $('title').text(),
link,
item,
};
};