Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat(add route): VisionIAS route for daily news #18030

Merged
merged 5 commits into from
Jan 4, 2025
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
8 changes: 8 additions & 0 deletions lib/routes/visionias/namespace.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,8 @@
import type { Namespace } from '@/types';

export const namespace: Namespace = {
name: 'VisionIAS',
url: 'visionias.in',
lang: 'en',
categories: ['study'],
};
100 changes: 100 additions & 0 deletions lib/routes/visionias/news-today.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,100 @@
import { Data, Route } from '@/types';
import { baseUrl, extractNews } from './utils';
import dayjs from 'dayjs';
import ofetch from '@/utils/ofetch';
import { load } from 'cheerio';

import logger from '@/utils/logger';

export const route: Route = {
path: '/newsToday/:filter?',
example: '/visionias/newsToday',
features: {
requireConfig: false,
requirePuppeteer: false,
antiCrawler: false,
supportBT: false,
supportPodcast: false,
supportScihub: false,
},
parameters: {
filter: {
description: 'Period to fetch news for the current month. All news for the current month or only the latest',
default: 'latest',
options: [
{ value: 'all', label: 'All' },
{ value: 'latest', label: 'Latest' },
],
},
},
radar: [
{
source: ['visionias.in/current-affairs/news-today'],
target: '/newsToday',
},
],
name: 'News Today',
maintainers: ['Rjnishant530'],
handler,
};

async function handler(ctx): Promise<Data> {
const filter = ctx.req.param('filter') ?? 'latest';
const currentYear = dayjs().year();
const currentMonth = dayjs().month() + 1;
logger.debug(`Getting news for month ${currentMonth} and year ${currentYear}`);
const response = await ofetch(`${baseUrl}/current-affairs/news-today/getbymonth?year=${currentYear}&month=${currentMonth}`);

let items: any = [];
// let title = 'News Today';

if (response.length !== 0) {
if (filter === 'latest') {
const currentUrl = response[0].url;
// title = response[0].formatted_published_at;
items = await processCurrentNews(currentUrl);
} else {
const results = await Promise.all(response.map((element) => processCurrentNews(element.url)));
items.push(...results.flat());
}
}
return {
title: 'News Today | Current Affairs | Vision IAS',
link: `${baseUrl}/current-affairs/news-today/archive`,
description: 'News Today is a daily bulletin providing readers with a comprehensive overview of news developments, news types, and technical terms.',
language: 'en',
item: items,
image: `${baseUrl}/current-affairs/images/news-today-logo.svg`,
icon: `${baseUrl}/current-affairs/favicon.ico`,
logo: `${baseUrl}/current-affairs/favicon.ico`,
allowEmpty: true,
};
}

async function processCurrentNews(currentUrl) {
const response = await ofetch(`${baseUrl}${currentUrl}`);
const $ = load(response);
const items = $(`#table-of-content > ul > li > a`)
.toArray()
.map((item) => {
const link = $(item).attr('href');
const title = $(item).clone().children('span').remove().end().text().trim();
return {
title,
link: title === 'Also in News' ? link : `${baseUrl}${link}`,
guid: link,
};
});
const newsPromises = await Promise.allSettled(items.map((item) => extractNews(item, 'main > div > div.mt-6 > div.flex > div.flex.mt-6')));
const finalItems: any = [];
for (const news of newsPromises) {
if (news.status === 'fulfilled') {
finalItems.push(...(Array.isArray(news.value) ? news.value : [news.value]));
} else {
finalItems.push({
title: 'Error Parse News',
});
}
}
return finalItems;
}
6 changes: 6 additions & 0 deletions lib/routes/visionias/templates/description-sub.art
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
{{ if heading }}
<h2>{{ heading }}</h2>
{{ /if }}
{{ if articleContent }}
{{@ articleContent }}
{{ /if }}
12 changes: 12 additions & 0 deletions lib/routes/visionias/templates/description.art
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
{{ if heading }}
<h1>{{ heading }}</h1>
{{ /if }}
{{ if subItems }}
{{ each subItems item }}
{{ if item?.description }}
{{@ item.description }}
{{ /if }}
{{ /each }}
{{else}}
{{@ articleContent }}
{{ /if }}
109 changes: 109 additions & 0 deletions lib/routes/visionias/utils.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,109 @@
import { getCurrentPath } from '@/utils/helpers';
const __dirname = getCurrentPath(import.meta.url);

import { DataItem } from '@/types';
import { parseDate } from '@/utils/parse-date';
import { art } from '@/utils/render';
import path from 'node:path';
import ofetch from '@/utils/ofetch';
import { load } from 'cheerio';
import cache from '@/utils/cache';

export const baseUrl = 'https://visionias.in';

export async function extractNews(item, selector) {
Rjnishant530 marked this conversation as resolved.
Show resolved Hide resolved
if (item.link === '') {
return item;
}
return await cache.tryGet(item.link, async () => {
const response = await ofetch(item.link || '');
const $$ = load(response);
const postedDate = String($$('meta[property="article:published_time"]').attr('content'));
const updatedDate = String($$('meta[property="article:modified_time"]').attr('content'));
const tags = $$('meta[property="article:tag"]')
.toArray()
.map((tag) => $$(tag).attr('content'));
const content = $$(selector);
const heading = content.find('div.space-y-4 > h1').text();
const mainGroup = content.find('div.flex > div.w-full');

const shortArticles = mainGroup.find('[x-data^="{isShortArticleOpen"]');
const sections = mainGroup.find('[x-data^="{isSectionOpen"]');
if (shortArticles.length !== 0) {
const items = shortArticles.toArray().map((element) => {
const mainDiv = $$(element);
const title = mainDiv.find('a > div > h1').text().trim();
const id = mainDiv.find('a').attr('href');
const htmlContent = extractArticle(mainDiv.html());
const innerTags = mainDiv
.find('ul > li:contains("Tags :")')
?.nextAll('li')
.toArray()
.map((tag) => $$(tag).text());
const description = art(path.join(__dirname, `templates/description.art`), {
heading: title,
articleContent: htmlContent,
});
return {
title: `${title} | ${heading}`,
pubDate: parseDate(postedDate),
category: innerTags,
description,
link: `${item.link}${id}`,
author: 'Vision IAS',
} as DataItem;
});
return items;
} else if (sections.length === 0) {
const htmlContent = extractArticle(mainGroup.html());
const description = art(path.join(__dirname, 'templates/description.art'), {
heading,
articleContent: htmlContent,
});
return {
title: item.title,
pubDate: parseDate(postedDate),
category: tags,
description,
link: item.link,
updated: updatedDate ? parseDate(updatedDate) : null,
author: 'Vision IAS',
} as DataItem;
} else {
const items = sections.toArray().map((element) => {
const mainDiv = $$(element);
const title = mainDiv.find('a > div > h2').text().trim();
const htmlContent = extractArticle(mainDiv.html(), 'div.ck-content');
const description = art(path.join(__dirname, `templates/description-sub.art`), {
heading: title,
articleContent: htmlContent,
});
return { description };
});
const description = art(path.join(__dirname, `templates/description.art`), {
heading,
subItems: items,
});
return {
title: heading,
pubDate: parseDate(postedDate),
category: tags,
description,
link: item.link,
updated: updatedDate ? parseDate(updatedDate) : null,
author: 'Vision IAS',
} as DataItem;
}
});
}

function extractArticle(articleDiv, selectorString: string = '#article-content') {
const $ = load(articleDiv, null, false);
const articleDiv$ = $(articleDiv);
const articleContent = articleDiv$.find(String(selectorString));
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

selectorString is already a string. Do not recast the same type.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

lint is throwing error.

Prevent passing a function reference directly to iterator methods.
Do not pass function selector directly to .find(…).

articleContent.find('figure').each((_, element) => {
$(element).css('width', '');
});
const htmlContent = articleContent.html();
return htmlContent;
}
56 changes: 56 additions & 0 deletions lib/routes/visionias/weekly-focus.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,56 @@
import { Data, Route } from '@/types';
import { baseUrl, extractNews } from './utils';
import ofetch from '@/utils/ofetch';
import { load } from 'cheerio';

export const route: Route = {
path: '/weeklyFocus',
example: '/visionias/weeklyFocus',
features: {
requireConfig: false,
requirePuppeteer: false,
antiCrawler: false,
supportBT: false,
supportPodcast: false,
supportScihub: false,
},
radar: [
{
source: ['visionias.in/current-affairs/weekly-focus'],
target: '/weeklyFocus',
},
],
name: 'Weekly Focus',
maintainers: ['Rjnishant530'],
handler,
};

async function handler(ctx): Promise<Data> {
const limit = ctx.req.query('limit') ? Number.parseInt(ctx.req.query('limit'), 10) : 1;
const response = await ofetch(`${baseUrl}/current-affairs/weekly-focus/archive`);
const $ = load(response);
const cards = $('div.weekly-focus-single-card').slice(0, limit).toArray();
const individualLinks = cards.flatMap((card) =>
$(card)
.find('a:has(p)')
.toArray()
.map((item) => {
const link = $(item).attr('href');
return { link: link?.startsWith('http') ? link : `${baseUrl}${link}` };
})
);

const itemsPromise = await Promise.allSettled(individualLinks.map(({ link }) => extractNews({ link }, 'main > div > div.flex > div.flex.w-full > div.w-full.mt-6')));

return {
title: 'Weekly Focus | Current Affairs | Vision IAS',
link: `${baseUrl}/current-affairs/weekly-focus/archive`,
description: 'Weekly Focus provides weekly comprehensive analysis of current themes with multidimensional and consolidated content.',
language: 'en',
item: itemsPromise.map((item) => (item.status === 'fulfilled' ? item.value : { title: 'Error Parse News' })),
image: `${baseUrl}/current-affairs/images/weekly-focus-logo.svg`,
icon: `${baseUrl}/current-affairs/favicon.ico`,
logo: `${baseUrl}/current-affairs/favicon.ico`,
allowEmpty: true,
};
}
Loading