const asyncPool = require('tiny-async-pool'); const ProcessFeed = async (items, cookies, browser, limit, cache) => { let newCookies = []; const result = []; for await (const item of asyncPool(3, items.slice(0, limit), async (i) => { const url = `https://www.dcard.tw/service/api/v2/posts/${i.id}`; const content = await cache.tryGet(`dcard:${i.id}`, async () => { let response; // try catch 处理被删除的帖子 try { const page = await browser.newPage(); await page.setRequestInterception(true); page.on('request', (request) => { request.resourceType() === 'document' || request.resourceType() === 'script' || request.resourceType() === 'fetch' || request.resourceType() === 'xhr' ? request.continue() : request.abort(); }); await page.setExtraHTTPHeaders({ referer: `https://www.dcard.tw/f/${i.forumAlias}/p/${i.id}`, }); await page.setCookie(...cookies); await page.goto(url); await page.waitForSelector('body > pre'); response = await page.evaluate(() => document.querySelector('body > pre').innerText); newCookies = await page.cookies(); await page.close(); const data = JSON.parse(response); let body = data.content; body = body.replace(/(?=https?:\/\/).*?(?<=\.(jpe?g|gif|png))/gi, (m) => ``); body = body.replace(/(?=https?:\/\/).*(??)$/gim, (m) => `${m}`); body = body.replace(/\n/g, '
'); return body; } catch (error) { return ''; } }); i.description = content; return i; })) { result.push(item); } await cache.set('dcard:cookies', newCookies, 3600); return [...result, ...items.slice(limit)]; }; module.exports = { ProcessFeed, };