From 96aa034456c9eae74dafbf402c32402e46bcd4b3 Mon Sep 17 00:00:00 2001
From: MisteryMonster <40703811+MisteryMonster@users.noreply.github.com>
Date: Mon, 11 May 2020 18:37:21 +0800
Subject: [PATCH] =?UTF-8?q?feat:=20=E6=96=B0=E4=BA=AC=E6=8A=A5=E7=94=B5?=
=?UTF-8?q?=E5=AD=90=E6=8A=A5=20(#4725)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit
---
docs/traditional-media.md | 4 ++
lib/router.js | 1 +
lib/routes/bjnews/epaper.js | 80 +++++++++++++++++++++++++++++++++++++
3 files changed, 85 insertions(+)
mode change 100755 => 100644 lib/router.js
create mode 100644 lib/routes/bjnews/epaper.js
diff --git a/docs/traditional-media.md b/docs/traditional-media.md
index d494357c48..2fbe226a36 100644
--- a/docs/traditional-media.md
+++ b/docs/traditional-media.md
@@ -430,6 +430,10 @@ category 对应的关键词有
+### 电子报
+
+
+
## 新浪科技
### 科学探索
diff --git a/lib/router.js b/lib/router.js
old mode 100755
new mode 100644
index 62db2a41f5..f802af9758
--- a/lib/router.js
+++ b/lib/router.js
@@ -325,6 +325,7 @@ router.get('/smzdm/haowen/fenlei/:name/:sort?', require('./routes/smzdm/haowen_f
// 新京报
router.get('/bjnews/:cat', require('./routes/bjnews/news'));
+router.get('/bjnews/epaper/:cat', require('./routes/bjnews/epaper'));
// 停水通知
router.get('/tingshuitz/hangzhou', require('./routes/tingshuitz/hangzhou'));
diff --git a/lib/routes/bjnews/epaper.js b/lib/routes/bjnews/epaper.js
new file mode 100644
index 0000000000..45a9f72341
--- /dev/null
+++ b/lib/routes/bjnews/epaper.js
@@ -0,0 +1,80 @@
+const got = require('@/utils/got');
+const cheerio = require('cheerio');
+
+module.exports = async (ctx) => {
+ const cat = ctx.params.cat.toUpperCase();
+
+ const today = new Date();
+ const year = today.getFullYear(); // 获取时间
+ const month = String(today.getMonth() + 1).padStart(2, '0');
+ const day = String(today.getDate()).padStart(2, '0');
+ // 获取当天报纸的首页
+ const response = await got({
+ method: 'get',
+ url: `http://epaper.bjnews.com.cn/html/${year}-${month}/${day}/node_1.htm`,
+ });
+
+ const data = response.data;
+ const $ = cheerio.load(data);
+ const listdata = $('div#artcile_list_wapper tr').get();
+ // 根据必选参数判断是哪一叠
+ const list = cat.indexOf('SPECIAL') === -1 ? listdata.filter((e) => $(e).find('a').text().substring(1, 2) === cat) : listdata.filter((e) => $(e).find('a').text().substring(1, 2) === '0');
+ // 遍历该叠面里第N版导航链接,数组内容为A01头版内容,A02等
+ const articledata = await Promise.all(
+ list.map(async (item) => {
+ const link = `http://epaper.bjnews.com.cn/html/${year}-${month}/${day}/${$(item).find('a').attr('href')}`;
+ // 缓存某叠下版面链接
+ const cache = await ctx.cache.get(link);
+ if (cache) {
+ return Promise.resolve(JSON.parse(cache));
+ }
+
+ const response2 = await got({
+ method: 'get',
+ url: link,
+ });
+
+ const articleHtml = response2.data;
+ const $2 = cheerio.load(articleHtml);
+ const paperarea = $2('ul.jcul li').get();
+ // 遍历某板块,N版面的内容,到一个数组里。
+ const innercontents = await Promise.all(
+ paperarea.map(async (item) => {
+ const contentdataurl = `http://epaper.bjnews.com.cn/html/${year}-${month}/${day}/${$(item).find('a').attr('href')}`;
+ const response3 = await got({
+ method: 'get',
+ url: contentdataurl,
+ });
+
+ const contentHtml = response3.data;
+ const $3 = cheerio.load(contentHtml);
+
+ const ititle = $3('div.rit h1').text();
+ const iprecontent = $3('div.tpnr').html();
+ const imaincontent = $3('founder-content').html();
+ // 这里查看是正常输出的!
+ const icontent = `${ititle}
${iprecontent}${imaincontent}
`;
+ return Promise.resolve(icontent);
+ })
+ );
+ // end
+ const single = {
+ description: innercontents,
+ title: `${year}-${month}-${day}|${$(item).text()}`,
+ link,
+ };
+ ctx.cache.set(link, JSON.stringify(single));
+ return Promise.resolve(single);
+ })
+ );
+
+ ctx.state.data = {
+ title: `新京报电子报|${cat}叠`,
+ link: `http://epaper.bjnews.com.cn/html/${year}-${month}/${day}/node_1.htm`,
+ item: list.map((item, index) => ({
+ title: `${articledata[index].title}`,
+ description: `${articledata[index].description}`,
+ link: `${articledata[index].link}`,
+ })),
+ };
+};