rsshub
Version:
Make RSS Great Again!
99 lines (81 loc) • 3 kB
text/typescript
import { Route } from '@/types';
import cache from '@/utils/cache';
import got from '@/utils/got';
import { load } from 'cheerio';
import { parseDate } from '@/utils/parse-date';
export const route: Route = {
path: '/:language?/:category?',
categories: ['new-media'],
example: '/swissinfo/eng/latest-news',
parameters: { language: 'Language, eng by default', category: 'Category, Latest News by default' },
features: {
requireConfig: false,
requirePuppeteer: false,
antiCrawler: false,
supportBT: false,
supportPodcast: false,
supportScihub: false,
},
radar: [
{
source: ['swissinfo.ch/:language/:category', 'swissinfo.ch/'],
},
],
name: 'Category',
maintainers: ['nczitzk'],
handler,
};
async function handler(ctx) {
const language = ctx.req.param('language') ?? 'eng';
const category = ctx.req.param('category') ?? 'latest-news';
const rootUrl = 'https://www.swissinfo.ch';
const currentUrl = `${rootUrl}/${language}/${category}`;
const response = await got({
method: 'get',
url: currentUrl,
});
let $ = load(response.data);
const title = $('title').text();
const fragmentResponse = await got({
method: 'get',
url: `${rootUrl}${$('main div[data-fragment-placeholder]').attr('data-fragment-placeholder')}`,
});
$ = load(fragmentResponse.data);
let items = $('.si-teaser__link')
.slice(0, ctx.req.query('limit') ? Number.parseInt(ctx.req.query('limit')) : 20)
.toArray()
.map((item) => {
item = $(item);
return {
link: `${rootUrl}${item.attr('href')}`,
title: item.find('.si-teaser__title').text(),
pubDate: parseDate(item.find('.si-teaser__date').attr('datetime')),
};
});
items = await Promise.all(
items.map((item) =>
cache.tryGet(item.link, async () => {
const detailResponse = await got({
method: 'get',
url: item.link,
});
const content = load(detailResponse.data);
content('.si-detail__content .si-grid').remove();
content('.si-detail__content .si-teaser').remove();
content('.show-for-sr, time, address, .si-detail__translation').remove();
content('picture').each(function () {
content(this).html(`<img src="${content(this).find('source').first().attr('srcset')}">`);
});
item.description = content('.si-detail__content').html();
item.author = content('meta[name="author"]').attr('content');
item.guid = detailResponse.data.match(/content_id: "(.*)",/)[1];
return item;
})
)
);
return {
title,
link: currentUrl,
item: items,
};
}