rsshub
Version:
Make RSS Great Again!
259 lines (231 loc) • 9.48 kB
text/typescript
import { type Data, type DataItem, type Route, ViewType } from '@/types';
import { art } from '@/utils/render';
import cache from '@/utils/cache';
import ofetch from '@/utils/ofetch';
import { parseDate } from '@/utils/parse-date';
import { type CheerioAPI, type Cheerio, load } from 'cheerio';
import type { Element } from 'domhandler';
import { type Context } from 'hono';
import path from 'node:path';
export const handler = async (ctx: Context): Promise<Data> => {
const { id = 'tzgg' } = ctx.req.param();
const limit: number = Number.parseInt(ctx.req.query('limit') ?? '10', 10);
const baseUrl: string = 'https://hitgs.hit.edu.cn';
const targetUrl: string = new URL(`${id}/list.htm`, baseUrl).href;
const response = await ofetch(targetUrl);
const $: CheerioAPI = load(response);
const language = $('html').attr('lang') ?? 'zh';
let items: DataItem[] = [];
items = $('li.news, div.tbt17')
.slice(0, limit)
.toArray()
.map((el): Element => {
const $el: Cheerio<Element> = $(el);
const title: string = $el.find('div.news_title, span.div.news_title, div.bttb2').text();
const description: string | undefined = art(path.join(__dirname, 'templates/description.art'), {
intro: $el.find('div.news_text, div.jj5').text(),
});
const pubDateStr: string | undefined = $('span.news_meta').text() || ($('span.news_days').text() ? `${$('span.news_days').text()}-${$('span.news_year').text()}` : `${$('div.tm-3').text()}-${$('div.tm-1').text()}`);
const linkUrl: string | undefined = $el.find('div.news_title a').attr('href') ?? $el.find('div.bttb2 a').attr('href') ?? $el.find('a').attr('href');
const upDatedStr: string | undefined = pubDateStr;
const processedItem: DataItem = {
title,
description,
pubDate: parseDate(pubDateStr),
link: linkUrl ? new URL(linkUrl, baseUrl).href : undefined,
content: {
html: description,
text: description,
},
updated: parseDate(upDatedStr),
language,
};
return processedItem;
});
items = await Promise.all(
items.map((item) => {
if (!item.link) {
return item;
}
return cache.tryGet(item.link, async (): Promise<DataItem> => {
const detailResponse = await ofetch(item.link);
const $$: CheerioAPI = load(detailResponse);
const title: string = $$('h1.arti_title').text() + $$('h2.arti_title').text();
const description: string | undefined = art(path.join(__dirname, 'templates/description.art'), {
description: $$('div.wp_articlecontent').html(),
});
const pubDateStr: string | undefined = $$('span.arti_update').text().split(/:/).pop()?.trim();
const upDatedStr: string | undefined = pubDateStr;
let processedItem: DataItem = {
title,
description,
pubDate: pubDateStr ? parseDate(pubDateStr) : item.pubDate,
content: {
html: description,
text: description,
},
updated: upDatedStr ? parseDate(upDatedStr) : item.updated,
language,
};
const $enclosureEl: Cheerio<Element> = $$('a[sudyfile-attr]')
.filter((_, el) => {
const $el: Cheerio<Element> = $$(el);
return !$el.attr('href')?.endsWith('htm');
})
.first();
const enclosureUrl: string | undefined = $enclosureEl.attr('href');
if (enclosureUrl) {
const enclosureType: string = `application/${enclosureUrl.split(/\./).pop() || 'octet-stream'}`;
const enclosureTitle: string | undefined = $enclosureEl.attr('sudyfile-attr')?.match(/'title':'(.*?)'/)?.[1];
processedItem = {
...processedItem,
enclosure_url: new URL(enclosureUrl, baseUrl).href,
enclosure_type: enclosureType,
enclosure_title: enclosureTitle || title,
};
}
return {
...item,
...processedItem,
};
});
})
);
const title: string = $('title').text();
const author: string = $('p.copyright span').first().text().split(/©/).pop() ?? '';
return {
title: `${author ? `${author} - ` : ''}${title}`,
description: title,
link: targetUrl,
item: items,
allowEmpty: true,
image: $('div.foot-logo img').attr('src'),
author,
language,
id: targetUrl,
};
};
export const route: Route = {
path: '/hitgs/:id?',
name: '研究生院',
url: 'hitgs.hit.edu.cn',
maintainers: ['hlmu', 'nczitzk'],
handler,
example: '/hit/hitgs/tzgg',
parameters: {
category: {
description: '分类,默认为 `tzgg`,即通知公告,可在对应分类页 URL 中找到',
options: [
{
label: '通知公告',
value: 'tzgg',
},
{
label: '综合新闻',
value: 'zhxw',
},
{
label: '高水平课程与学术交流',
value: 'gspkcyxsjl',
},
{
label: '国家政策',
value: 'gjzc',
},
{
label: '规章制度',
value: '17546',
},
{
label: '办事流程',
value: '17547',
},
{
label: '常见问题',
value: '17548',
},
{
label: '常见下载',
value: '17549',
},
],
},
},
description: `::: tip
订阅 [通知公告](https://hitgs.hit.edu.cn/tzgg/list.htm),其源网址为 \`https://hitgs.hit.edu.cn/tzgg/list.htm\`,请参考该 URL 指定部分构成参数,此时路由为 [\`/hit/hitgs/tzgg\`](https://rsshub.app/hit/hitgs/tzgg)。
:::
<details>
<summary>更多栏目</summary>
| 栏目 | ID |
| - | - |
| [通知公告](https://hitgs.hit.edu.cn/tzgg/list.htm) | [tzgg](https://rsshub.app/hit/hitgs/tzgg) |
| [综合新闻](https://hitgs.hit.edu.cn/zhxw/list.htm) | [zhxw](https://rsshub.app/hit/hitgs/zhxw) |
| [高水平课程与学术交流](https://hitgs.hit.edu.cn/gspkcyxsjl/list.htm) | [gspkcyxsjl](https://rsshub.app/hit/hitgs/gspkcyxsjl) |
| [国家政策](https://hitgs.hit.edu.cn/gjzc/list.htm) | [gjzc](https://rsshub.app/hit/hitgs/gjzc) |
| [规章制度](https://hitgs.hit.edu.cn/17546/list.htm) | [17546](https://rsshub.app/hit/hitgs/17546) |
| [办事流程](https://hitgs.hit.edu.cn/17547/list.htm) | [17547](https://rsshub.app/hit/hitgs/17547) |
| [常见问题](https://hitgs.hit.edu.cn/17548/list.htm) | [17548](https://rsshub.app/hit/hitgs/17548) |
| [常见下载](https://hitgs.hit.edu.cn/17549/list.htm) | [17549](https://rsshub.app/hit/hitgs/17549) |
</details>
`,
categories: ['university'],
features: {
requireConfig: false,
requirePuppeteer: false,
antiCrawler: false,
supportRadar: true,
supportBT: false,
supportPodcast: false,
supportScihub: false,
},
radar: [
{
source: ['hitgs.hit.edu.cn', 'hitgs.hit.edu.cn/:id/list.htm'],
target: (params) => {
const id: string = params.id;
return `/hit/hitgs${id ? `/${id}` : ''}`;
},
},
{
title: '通知公告',
source: ['hitgs.hit.edu.cn/tzgg/list.htm'],
target: '/hitgs/tzgg',
},
{
title: '综合新闻',
source: ['hitgs.hit.edu.cn/zhxw/list.htm'],
target: '/hitgs/zhxw',
},
{
title: '高水平课程与学术交流',
source: ['hitgs.hit.edu.cn/gspkcyxsjl/list.htm'],
target: '/hitgs/gspkcyxsjl',
},
{
title: '国家政策',
source: ['hitgs.hit.edu.cn/gjzc/list.htm'],
target: '/hitgs/gjzc',
},
{
title: '规章制度',
source: ['hitgs.hit.edu.cn/17546/list.htm'],
target: '/hitgs/17546',
},
{
title: '办事流程',
source: ['hitgs.hit.edu.cn/17547/list.htm'],
target: '/hitgs/17547',
},
{
title: '常见问题',
source: ['hitgs.hit.edu.cn/17548/list.htm'],
target: '/hitgs/17548',
},
{
title: '常见下载',
source: ['hitgs.hit.edu.cn/17549/list.htm'],
target: '/hitgs/17549',
},
],
view: ViewType.Articles,
};