From 337763b89dd2e8b12c521c954e66b9c4f40dbd2b Mon Sep 17 00:00:00 2001 From: rjnishant530 Date: Thu, 2 Jan 2025 22:30:06 +0530 Subject: [PATCH 1/5] init --- lib/routes/visionias/namespace.ts | 8 + lib/routes/visionias/news-today.ts | 168 ++++++++++++++++++ .../visionias/templates/description.art | 6 + lib/routes/visionias/utils.ts | 1 + 4 files changed, 183 insertions(+) create mode 100644 lib/routes/visionias/namespace.ts create mode 100644 lib/routes/visionias/news-today.ts create mode 100644 lib/routes/visionias/templates/description.art create mode 100644 lib/routes/visionias/utils.ts diff --git a/lib/routes/visionias/namespace.ts b/lib/routes/visionias/namespace.ts new file mode 100644 index 00000000000000..311b0a695be1f2 --- /dev/null +++ b/lib/routes/visionias/namespace.ts @@ -0,0 +1,8 @@ +import type { Namespace } from '@/types'; + +export const namespace: Namespace = { + name: 'VisionIAS', + url: 'visionias.in', + lang: 'en', + categories: ['study'], +}; diff --git a/lib/routes/visionias/news-today.ts b/lib/routes/visionias/news-today.ts new file mode 100644 index 00000000000000..9366f009c5df8f --- /dev/null +++ b/lib/routes/visionias/news-today.ts @@ -0,0 +1,168 @@ +import { Data, DataItem, Route } from '@/types'; +import { baseUrl } from './utils'; +import dayjs from 'dayjs'; +import ofetch from '@/utils/ofetch'; +import { load } from 'cheerio'; +import { parseDate } from '@/utils/parse-date'; +import { art } from '@/utils/render'; +import path from 'node:path'; +import logger from '@/utils/logger'; + +export const route: Route = { + path: '/newsToday', + example: '/visionias/newsToday', + features: { + requireConfig: false, + requirePuppeteer: false, + antiCrawler: false, + supportBT: false, + supportPodcast: false, + supportScihub: false, + }, + radar: [ + { + source: ['visionias.in/current-affairs/news-today'], + target: '/newsToday', + }, + ], + name: 'News Today', + maintainers: ['Rjnishant530'], + handler, +}; + +async function handler(): Promise { + const currentYear = dayjs().year(); + const currentMonth = dayjs().month() + 1; + logger.info(`Getting news for month ${currentMonth} and year ${currentYear}`); + const response = await ofetch(`${baseUrl}/current-affairs/news-today/getbymonth?year=${currentYear}&month=${currentMonth}`); + + let items: any = []; + // let title = 'News Today'; + let currentUrl = ''; + if (response.length !== 0) { + currentUrl = response[0].url; + // title = response[0].formatted_published_at; + items = await processCurrentNews(currentUrl); + } + + return { + title: `News Today | Current Affairs | Vision IAS`, + link: `${baseUrl}${currentUrl === '' ? '/current-affairs/news-today/' : currentUrl}`, + description: 'News Today is a daily bulletin providing readers with a comprehensive overview of news developments, news types, and technical terms.', + language: 'en', + item: items, + image: `${baseUrl}/current-affairs/images/news-today-logo.svg`, + icon: `${baseUrl}/current-affairs/favicon.ico`, + logo: `${baseUrl}/current-affairs/favicon.ico`, + allowEmpty: true, + }; +} + +async function processCurrentNews(currentUrl) { + const response = await ofetch(`${baseUrl}${currentUrl}`); + const $ = load(response); + const items = $(`#table-of-content > ul > li > a`) + .toArray() + .map((item) => { + const link = $(item).attr('href'); + const title = $(item).clone().children('span').remove().end().text().trim(); + return { + title, + link: title === 'Also in News' ? link : `${baseUrl}${link}`, + guid: link, + }; + }); + + const normalNews: any = []; + const alsoInNews: any = []; + + for (const item of items) { + if (item.title === 'Also in News') { + alsoInNews.push(item); + } else { + normalNews.push(item); + } + } + const finalItems = await Promise.allSettled( + normalNews.map((item) => processOnePerPage(item)) + ); + const alsoInNewsItems = await processMultiplePerPage(alsoInNews[0]); + return [...finalItems.map((item) => (item.status === 'fulfilled' ? item.value : { title: 'Error : Something Went Wrong' })), ...alsoInNewsItems]; +} + +async function processMultiplePerPage(groupedItem) { + if (groupedItem.link === '') { + return groupedItem; + } + const response = await ofetch(groupedItem.link || ''); + const $$ = load(response); + const mainGroup = $$('main > div > div.mt-6 > div.flex > div.flex.mt-6 > div.flex > div.w-full'); + const postedDate = mainGroup.find('p:contains("Posted ") > strong').text(); + const shortArticles = mainGroup.find('[x-data^="{isShortArticleOpen"]'); + const items = shortArticles.map((_, element) => { + const title = $$(element).find('a > div > h1').text().trim(); + const id = $$(element).find('a').attr('href'); + const articleContent = $$(element).find('#article-content').html(); + const tags = $$(element) + .find('ul > li:contains("Tags :")') + .nextAll('li') + .toArray() + .map((tag) => $$(tag).text()); + const description = art(path.join(__dirname, 'templates/description.art'), { + heading: title, + articleContent, + }); + return { + title: `${title} | ${groupedItem.title}`, + pubDate: parseDate(postedDate), + category: tags, + description, + link: `${groupedItem.link}${id}`, + author: 'Vision IAS', + } as DataItem; + }); + return items; +} + +async function processOnePerPage(item) { + if (item.link === '') { + return item; + } + try { + const response = await ofetch(item.link || ''); + const $$ = load(response); + const content = $$('main > div > div.mt-6 > div.flex > div.flex.mt-6'); + const heading = content.find('div.space-y-4 > h1').text(); + const mainGroup = content.find('div.flex > div.w-full'); + const postedDate = mainGroup.find('p:contains("Posted ") > strong').text(); + const articleContent = mainGroup.find('#article-content'); + articleContent.find('figure').each((_, element) => { + $$(element).css('width', ''); + }); + const htmlContent = articleContent.html(); + const tags = mainGroup + .find('ul > li:contains("Tags :")') + .nextAll('li') + .toArray() + .map((tag) => $$(tag).text()); + const description = art(path.join(__dirname, 'templates/description.art'), { + heading, + articleContent: htmlContent, + }); + return { + title: item.title, + pubDate: parseDate(postedDate), + category: tags, + description, + link: item.link, + author: 'Vision IAS', + } as DataItem; + } catch { + return { + title: item.title, + description: 'Unable to Fetch', + link: item.link, + author: 'Vision IAS', + } as DataItem; + } +} diff --git a/lib/routes/visionias/templates/description.art b/lib/routes/visionias/templates/description.art new file mode 100644 index 00000000000000..d70868e84249b6 --- /dev/null +++ b/lib/routes/visionias/templates/description.art @@ -0,0 +1,6 @@ +{{ if heading }} +

{{ heading }}

+{{ /if }} +{{ if articleContent }} + {{@ articleContent }} +{{ /if }} \ No newline at end of file diff --git a/lib/routes/visionias/utils.ts b/lib/routes/visionias/utils.ts new file mode 100644 index 00000000000000..541aaa1d81c060 --- /dev/null +++ b/lib/routes/visionias/utils.ts @@ -0,0 +1 @@ +export const baseUrl = 'https://visionias.in'; From fc615eeb63569ef6e6231ec050a0e28eefeb4874 Mon Sep 17 00:00:00 2001 From: rjnishant530 Date: Thu, 2 Jan 2025 22:40:00 +0530 Subject: [PATCH 2/5] fix __dir --- lib/routes/visionias/news-today.ts | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/lib/routes/visionias/news-today.ts b/lib/routes/visionias/news-today.ts index 9366f009c5df8f..a8a9458b92cb1b 100644 --- a/lib/routes/visionias/news-today.ts +++ b/lib/routes/visionias/news-today.ts @@ -1,4 +1,6 @@ import { Data, DataItem, Route } from '@/types'; +import { getCurrentPath } from '@/utils/helpers'; +const __dirname = getCurrentPath(import.meta.url); import { baseUrl } from './utils'; import dayjs from 'dayjs'; import ofetch from '@/utils/ofetch'; @@ -83,9 +85,7 @@ async function processCurrentNews(currentUrl) { normalNews.push(item); } } - const finalItems = await Promise.allSettled( - normalNews.map((item) => processOnePerPage(item)) - ); + const finalItems = await Promise.allSettled(normalNews.map((item) => processOnePerPage(item))); const alsoInNewsItems = await processMultiplePerPage(alsoInNews[0]); return [...finalItems.map((item) => (item.status === 'fulfilled' ? item.value : { title: 'Error : Something Went Wrong' })), ...alsoInNewsItems]; } From 98cdf181a239139e0bb6b92ee10a36fc6ecbb3b2 Mon Sep 17 00:00:00 2001 From: rjnishant530 Date: Fri, 3 Jan 2025 14:54:09 +0530 Subject: [PATCH 3/5] add news route --- lib/routes/visionias/news-today.ts | 138 +++++------------- .../visionias/templates/description-sub.art | 6 + .../visionias/templates/description.art | 10 +- lib/routes/visionias/utils.ts | 106 ++++++++++++++ lib/routes/visionias/weekly-focus.ts | 57 ++++++++ 5 files changed, 212 insertions(+), 105 deletions(-) create mode 100644 lib/routes/visionias/templates/description-sub.art create mode 100644 lib/routes/visionias/weekly-focus.ts diff --git a/lib/routes/visionias/news-today.ts b/lib/routes/visionias/news-today.ts index a8a9458b92cb1b..506993645673fa 100644 --- a/lib/routes/visionias/news-today.ts +++ b/lib/routes/visionias/news-today.ts @@ -1,17 +1,13 @@ -import { Data, DataItem, Route } from '@/types'; -import { getCurrentPath } from '@/utils/helpers'; -const __dirname = getCurrentPath(import.meta.url); -import { baseUrl } from './utils'; +import { Data, Route } from '@/types'; +import { baseUrl, extractNews } from './utils'; import dayjs from 'dayjs'; import ofetch from '@/utils/ofetch'; import { load } from 'cheerio'; -import { parseDate } from '@/utils/parse-date'; -import { art } from '@/utils/render'; -import path from 'node:path'; + import logger from '@/utils/logger'; export const route: Route = { - path: '/newsToday', + path: '/newsToday/:filter?', example: '/visionias/newsToday', features: { requireConfig: false, @@ -21,6 +17,16 @@ export const route: Route = { supportPodcast: false, supportScihub: false, }, + parameters: { + filter: { + description: 'Period to fetch news for the current month. All news for the current month or only the latest', + default: 'latest', + options: [ + { value: 'all', label: 'All' }, + { value: 'latest', label: 'Latest' }, + ], + }, + }, radar: [ { source: ['visionias.in/current-affairs/news-today'], @@ -32,7 +38,8 @@ export const route: Route = { handler, }; -async function handler(): Promise { +async function handler(ctx): Promise { + const filter = ctx.req.param('filter') ?? 'latest'; const currentYear = dayjs().year(); const currentMonth = dayjs().month() + 1; logger.info(`Getting news for month ${currentMonth} and year ${currentYear}`); @@ -40,16 +47,20 @@ async function handler(): Promise { let items: any = []; // let title = 'News Today'; - let currentUrl = ''; + if (response.length !== 0) { - currentUrl = response[0].url; - // title = response[0].formatted_published_at; - items = await processCurrentNews(currentUrl); + if (filter === 'latest') { + const currentUrl = response[0].url; + // title = response[0].formatted_published_at; + items = await processCurrentNews(currentUrl); + } else { + const results = await Promise.all(response.map((element) => processCurrentNews(element.url))); + items.push(...results.flat()); + } } - return { title: `News Today | Current Affairs | Vision IAS`, - link: `${baseUrl}${currentUrl === '' ? '/current-affairs/news-today/' : currentUrl}`, + link: `${baseUrl}/current-affairs/news-today/archive`, description: 'News Today is a daily bulletin providing readers with a comprehensive overview of news developments, news types, and technical terms.', language: 'en', item: items, @@ -74,95 +85,16 @@ async function processCurrentNews(currentUrl) { guid: link, }; }); - - const normalNews: any = []; - const alsoInNews: any = []; - - for (const item of items) { - if (item.title === 'Also in News') { - alsoInNews.push(item); + const newsPromises = await Promise.allSettled(items.map((item) => extractNews(item, 'main > div > div.mt-6 > div.flex > div.flex.mt-6'))); + const finalItems: any = []; + for (const news of newsPromises) { + if (news.status === 'fulfilled') { + finalItems.push(...(Array.isArray(news.value) ? news.value : [news.value])); } else { - normalNews.push(item); + finalItems.push({ + title: 'Error Parse News', + }); } } - const finalItems = await Promise.allSettled(normalNews.map((item) => processOnePerPage(item))); - const alsoInNewsItems = await processMultiplePerPage(alsoInNews[0]); - return [...finalItems.map((item) => (item.status === 'fulfilled' ? item.value : { title: 'Error : Something Went Wrong' })), ...alsoInNewsItems]; -} - -async function processMultiplePerPage(groupedItem) { - if (groupedItem.link === '') { - return groupedItem; - } - const response = await ofetch(groupedItem.link || ''); - const $$ = load(response); - const mainGroup = $$('main > div > div.mt-6 > div.flex > div.flex.mt-6 > div.flex > div.w-full'); - const postedDate = mainGroup.find('p:contains("Posted ") > strong').text(); - const shortArticles = mainGroup.find('[x-data^="{isShortArticleOpen"]'); - const items = shortArticles.map((_, element) => { - const title = $$(element).find('a > div > h1').text().trim(); - const id = $$(element).find('a').attr('href'); - const articleContent = $$(element).find('#article-content').html(); - const tags = $$(element) - .find('ul > li:contains("Tags :")') - .nextAll('li') - .toArray() - .map((tag) => $$(tag).text()); - const description = art(path.join(__dirname, 'templates/description.art'), { - heading: title, - articleContent, - }); - return { - title: `${title} | ${groupedItem.title}`, - pubDate: parseDate(postedDate), - category: tags, - description, - link: `${groupedItem.link}${id}`, - author: 'Vision IAS', - } as DataItem; - }); - return items; -} - -async function processOnePerPage(item) { - if (item.link === '') { - return item; - } - try { - const response = await ofetch(item.link || ''); - const $$ = load(response); - const content = $$('main > div > div.mt-6 > div.flex > div.flex.mt-6'); - const heading = content.find('div.space-y-4 > h1').text(); - const mainGroup = content.find('div.flex > div.w-full'); - const postedDate = mainGroup.find('p:contains("Posted ") > strong').text(); - const articleContent = mainGroup.find('#article-content'); - articleContent.find('figure').each((_, element) => { - $$(element).css('width', ''); - }); - const htmlContent = articleContent.html(); - const tags = mainGroup - .find('ul > li:contains("Tags :")') - .nextAll('li') - .toArray() - .map((tag) => $$(tag).text()); - const description = art(path.join(__dirname, 'templates/description.art'), { - heading, - articleContent: htmlContent, - }); - return { - title: item.title, - pubDate: parseDate(postedDate), - category: tags, - description, - link: item.link, - author: 'Vision IAS', - } as DataItem; - } catch { - return { - title: item.title, - description: 'Unable to Fetch', - link: item.link, - author: 'Vision IAS', - } as DataItem; - } + return finalItems; } diff --git a/lib/routes/visionias/templates/description-sub.art b/lib/routes/visionias/templates/description-sub.art new file mode 100644 index 00000000000000..e947d6315aa283 --- /dev/null +++ b/lib/routes/visionias/templates/description-sub.art @@ -0,0 +1,6 @@ +{{ if heading }} +

{{ heading }}

+{{ /if }} +{{ if articleContent }} + {{@ articleContent }} +{{ /if }} \ No newline at end of file diff --git a/lib/routes/visionias/templates/description.art b/lib/routes/visionias/templates/description.art index d70868e84249b6..2f92e6a1c8d17b 100644 --- a/lib/routes/visionias/templates/description.art +++ b/lib/routes/visionias/templates/description.art @@ -1,6 +1,12 @@ {{ if heading }}

{{ heading }}

{{ /if }} -{{ if articleContent }} - {{@ articleContent }} +{{ if subItems }} + {{ each subItems item }} + {{ if item?.description }} + {{@ item.description }} + {{ /if }} + {{ /each }} +{{else}} + {{@ articleContent }} {{ /if }} \ No newline at end of file diff --git a/lib/routes/visionias/utils.ts b/lib/routes/visionias/utils.ts index 541aaa1d81c060..dbba2841ddb6f9 100644 --- a/lib/routes/visionias/utils.ts +++ b/lib/routes/visionias/utils.ts @@ -1 +1,107 @@ +import { getCurrentPath } from '@/utils/helpers'; +const __dirname = getCurrentPath(import.meta.url); + +import { DataItem } from '@/types'; +import { parseDate } from '@/utils/parse-date'; +import { art } from '@/utils/render'; +import path from 'node:path'; +import ofetch from '@/utils/ofetch'; +import { load } from 'cheerio'; + export const baseUrl = 'https://visionias.in'; + +export async function extractNews(item, selector) { + if (item.link === '') { + return item; + } + const response = await ofetch(item.link || ''); + const $$ = load(response); + const content = $$(selector); + const heading = content.find('div.space-y-4 > h1').text(); + const mainGroup = content.find('div.flex > div.w-full'); + const postedDate = mainGroup.find('p:contains("Posted ") > strong').text(); + const updatedDate = mainGroup.find('p:contains("Updated ") > strong').text(); + const tags = mainGroup + .find('ul > li:contains("Tags :")') + ?.nextAll('li') + .toArray() + .map((tag) => $$(tag).text()); + const shortArticles = mainGroup.find('[x-data^="{isShortArticleOpen"]'); + const sections = mainGroup.find('[x-data^="{isSectionOpen"]'); + if (shortArticles.length !== 0) { + const items = shortArticles.toArray().map((element) => { + const mainDiv = $$(element); + const title = mainDiv.find('a > div > h1').text().trim(); + const id = mainDiv.find('a').attr('href'); + const htmlContent = extractArticle(mainDiv.html()); + const innerTags = mainDiv + .find('ul > li:contains("Tags :")') + ?.nextAll('li') + .toArray() + .map((tag) => $$(tag).text()); + const description = art(path.join(__dirname, `templates/description.art`), { + heading: title, + articleContent: htmlContent, + }); + return { + title: `${title} | ${heading}`, + pubDate: parseDate(postedDate), + category: innerTags, + description, + link: `${item.link}${id}`, + author: 'Vision IAS', + } as DataItem; + }); + return items; + } else if (sections.length === 0) { + const htmlContent = extractArticle(mainGroup.html()); + const description = art(path.join(__dirname, 'templates/description.art'), { + heading, + articleContent: htmlContent, + }); + return { + title: item.title, + pubDate: parseDate(postedDate), + category: tags, + description, + link: item.link, + updated: updatedDate ? parseDate(updatedDate) : null, + author: 'Vision IAS', + } as DataItem; + } else { + const items = sections.toArray().map((element) => { + const mainDiv = $$(element); + const title = mainDiv.find('a > div > h2').text().trim(); + const htmlContent = extractArticle(mainDiv.html(), 'div.ck-content'); + const description = art(path.join(__dirname, `templates/description-sub.art`), { + heading: title, + articleContent: htmlContent, + }); + return { description }; + }); + const description = art(path.join(__dirname, `templates/description.art`), { + heading, + subItems: items, + }); + return { + title: heading, + pubDate: parseDate(postedDate), + category: tags, + description, + link: item.link, + updated: updatedDate ? parseDate(updatedDate) : null, + author: 'Vision IAS', + } as DataItem; + } +} + +function extractArticle(articleDiv, selector: string = '#article-content') { + const $ = load(articleDiv, null, false); + const articleDiv$ = $(articleDiv); + const articleContent = articleDiv$.find(selector); + articleContent.find('figure').each((_, element) => { + $(element).css('width', ''); + }); + const htmlContent = articleContent.html(); + return htmlContent; +} diff --git a/lib/routes/visionias/weekly-focus.ts b/lib/routes/visionias/weekly-focus.ts new file mode 100644 index 00000000000000..e87d1b896f45bd --- /dev/null +++ b/lib/routes/visionias/weekly-focus.ts @@ -0,0 +1,57 @@ +import { Data, Route } from '@/types'; +import { baseUrl, extractNews } from './utils'; +import ofetch from '@/utils/ofetch'; +import { load } from 'cheerio'; + +export const route: Route = { + path: '/weeklyFocus', + example: '/visionias/weeklyFocus', + features: { + requireConfig: false, + requirePuppeteer: false, + antiCrawler: false, + supportBT: false, + supportPodcast: false, + supportScihub: false, + }, + radar: [ + { + source: ['visionias.in/current-affairs/weekly-focus'], + target: '/weeklyFocus', + }, + ], + name: 'Weekly Focus', + maintainers: ['Rjnishant530'], + handler, +}; + +async function handler(ctx): Promise { + const limit = ctx.req.query('limit') ? Number.parseInt(ctx.req.query('limit'), 10) : 1; + const response = await ofetch(`${baseUrl}/current-affairs/weekly-focus/archive`); + const $ = load(response); + const cards = $('div.weekly-focus-single-card').slice(0, limit).toArray(); + const individualLinks: any = []; + for (const card of cards) { + for (const item of $(card) + .find('a:has(p)') + .toArray()) { + const link = $(item).attr('href'); + individualLinks.push({ + link: link?.startsWith('http') ? link : `${baseUrl}${link}`, + }); + } + } + const itemsPromise = await Promise.allSettled(individualLinks.map(({ link }) => extractNews({ link }, 'main > div > div.flex > div.flex.w-full > div.w-full.mt-6'))); + + return { + title: `Weekly Focus | Current Affairs | Vision IAS`, + link: `${baseUrl}/current-affairs/weekly-focus/archive`, + description: 'Weekly Focus provides weekly comprehensive analysis of current themes with multidimensional and consolidated content.', + language: 'en', + item: itemsPromise.map((item) => (item.status === 'fulfilled' ? item.value : { title: 'Error Parse News' })), + image: `${baseUrl}/current-affairs/images/weekly-focus-logo.svg`, + icon: `${baseUrl}/current-affairs/favicon.ico`, + logo: `${baseUrl}/current-affairs/favicon.ico`, + allowEmpty: true, + }; +} From 73b07e9a6e8d4998b25e3b83150f620627bd61d8 Mon Sep 17 00:00:00 2001 From: rjnishant530 Date: Fri, 3 Jan 2025 14:59:57 +0530 Subject: [PATCH 4/5] not passing directly --- lib/routes/visionias/utils.ts | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/lib/routes/visionias/utils.ts b/lib/routes/visionias/utils.ts index dbba2841ddb6f9..92693a34b95c1f 100644 --- a/lib/routes/visionias/utils.ts +++ b/lib/routes/visionias/utils.ts @@ -95,10 +95,10 @@ export async function extractNews(item, selector) { } } -function extractArticle(articleDiv, selector: string = '#article-content') { +function extractArticle(articleDiv, selectorString: string = '#article-content') { const $ = load(articleDiv, null, false); const articleDiv$ = $(articleDiv); - const articleContent = articleDiv$.find(selector); + const articleContent = articleDiv$.find(String(selectorString)); articleContent.find('figure').each((_, element) => { $(element).css('width', ''); }); From 849da5d130eb533d87a94a7eed90eebe4983aa15 Mon Sep 17 00:00:00 2001 From: rjnishant530 Date: Sat, 4 Jan 2025 08:51:41 +0530 Subject: [PATCH 5/5] comment changes --- lib/routes/visionias/news-today.ts | 4 +- lib/routes/visionias/utils.ts | 144 ++++++++++++++------------- lib/routes/visionias/weekly-focus.ts | 19 ++-- 3 files changed, 84 insertions(+), 83 deletions(-) diff --git a/lib/routes/visionias/news-today.ts b/lib/routes/visionias/news-today.ts index 506993645673fa..d05e51313dc267 100644 --- a/lib/routes/visionias/news-today.ts +++ b/lib/routes/visionias/news-today.ts @@ -42,7 +42,7 @@ async function handler(ctx): Promise { const filter = ctx.req.param('filter') ?? 'latest'; const currentYear = dayjs().year(); const currentMonth = dayjs().month() + 1; - logger.info(`Getting news for month ${currentMonth} and year ${currentYear}`); + logger.debug(`Getting news for month ${currentMonth} and year ${currentYear}`); const response = await ofetch(`${baseUrl}/current-affairs/news-today/getbymonth?year=${currentYear}&month=${currentMonth}`); let items: any = []; @@ -59,7 +59,7 @@ async function handler(ctx): Promise { } } return { - title: `News Today | Current Affairs | Vision IAS`, + title: 'News Today | Current Affairs | Vision IAS', link: `${baseUrl}/current-affairs/news-today/archive`, description: 'News Today is a daily bulletin providing readers with a comprehensive overview of news developments, news types, and technical terms.', language: 'en', diff --git a/lib/routes/visionias/utils.ts b/lib/routes/visionias/utils.ts index 92693a34b95c1f..e9ebec22d51a16 100644 --- a/lib/routes/visionias/utils.ts +++ b/lib/routes/visionias/utils.ts @@ -7,6 +7,7 @@ import { art } from '@/utils/render'; import path from 'node:path'; import ofetch from '@/utils/ofetch'; import { load } from 'cheerio'; +import cache from '@/utils/cache'; export const baseUrl = 'https://visionias.in'; @@ -14,85 +15,86 @@ export async function extractNews(item, selector) { if (item.link === '') { return item; } - const response = await ofetch(item.link || ''); - const $$ = load(response); - const content = $$(selector); - const heading = content.find('div.space-y-4 > h1').text(); - const mainGroup = content.find('div.flex > div.w-full'); - const postedDate = mainGroup.find('p:contains("Posted ") > strong').text(); - const updatedDate = mainGroup.find('p:contains("Updated ") > strong').text(); - const tags = mainGroup - .find('ul > li:contains("Tags :")') - ?.nextAll('li') - .toArray() - .map((tag) => $$(tag).text()); - const shortArticles = mainGroup.find('[x-data^="{isShortArticleOpen"]'); - const sections = mainGroup.find('[x-data^="{isSectionOpen"]'); - if (shortArticles.length !== 0) { - const items = shortArticles.toArray().map((element) => { - const mainDiv = $$(element); - const title = mainDiv.find('a > div > h1').text().trim(); - const id = mainDiv.find('a').attr('href'); - const htmlContent = extractArticle(mainDiv.html()); - const innerTags = mainDiv - .find('ul > li:contains("Tags :")') - ?.nextAll('li') - .toArray() - .map((tag) => $$(tag).text()); - const description = art(path.join(__dirname, `templates/description.art`), { - heading: title, + return await cache.tryGet(item.link, async () => { + const response = await ofetch(item.link || ''); + const $$ = load(response); + const postedDate = String($$('meta[property="article:published_time"]').attr('content')); + const updatedDate = String($$('meta[property="article:modified_time"]').attr('content')); + const tags = $$('meta[property="article:tag"]') + .toArray() + .map((tag) => $$(tag).attr('content')); + const content = $$(selector); + const heading = content.find('div.space-y-4 > h1').text(); + const mainGroup = content.find('div.flex > div.w-full'); + + const shortArticles = mainGroup.find('[x-data^="{isShortArticleOpen"]'); + const sections = mainGroup.find('[x-data^="{isSectionOpen"]'); + if (shortArticles.length !== 0) { + const items = shortArticles.toArray().map((element) => { + const mainDiv = $$(element); + const title = mainDiv.find('a > div > h1').text().trim(); + const id = mainDiv.find('a').attr('href'); + const htmlContent = extractArticle(mainDiv.html()); + const innerTags = mainDiv + .find('ul > li:contains("Tags :")') + ?.nextAll('li') + .toArray() + .map((tag) => $$(tag).text()); + const description = art(path.join(__dirname, `templates/description.art`), { + heading: title, + articleContent: htmlContent, + }); + return { + title: `${title} | ${heading}`, + pubDate: parseDate(postedDate), + category: innerTags, + description, + link: `${item.link}${id}`, + author: 'Vision IAS', + } as DataItem; + }); + return items; + } else if (sections.length === 0) { + const htmlContent = extractArticle(mainGroup.html()); + const description = art(path.join(__dirname, 'templates/description.art'), { + heading, articleContent: htmlContent, }); return { - title: `${title} | ${heading}`, + title: item.title, pubDate: parseDate(postedDate), - category: innerTags, + category: tags, description, - link: `${item.link}${id}`, + link: item.link, + updated: updatedDate ? parseDate(updatedDate) : null, author: 'Vision IAS', } as DataItem; - }); - return items; - } else if (sections.length === 0) { - const htmlContent = extractArticle(mainGroup.html()); - const description = art(path.join(__dirname, 'templates/description.art'), { - heading, - articleContent: htmlContent, - }); - return { - title: item.title, - pubDate: parseDate(postedDate), - category: tags, - description, - link: item.link, - updated: updatedDate ? parseDate(updatedDate) : null, - author: 'Vision IAS', - } as DataItem; - } else { - const items = sections.toArray().map((element) => { - const mainDiv = $$(element); - const title = mainDiv.find('a > div > h2').text().trim(); - const htmlContent = extractArticle(mainDiv.html(), 'div.ck-content'); - const description = art(path.join(__dirname, `templates/description-sub.art`), { - heading: title, - articleContent: htmlContent, + } else { + const items = sections.toArray().map((element) => { + const mainDiv = $$(element); + const title = mainDiv.find('a > div > h2').text().trim(); + const htmlContent = extractArticle(mainDiv.html(), 'div.ck-content'); + const description = art(path.join(__dirname, `templates/description-sub.art`), { + heading: title, + articleContent: htmlContent, + }); + return { description }; }); - return { description }; - }); - const description = art(path.join(__dirname, `templates/description.art`), { - heading, - subItems: items, - }); - return { - title: heading, - pubDate: parseDate(postedDate), - category: tags, - description, - link: item.link, - updated: updatedDate ? parseDate(updatedDate) : null, - author: 'Vision IAS', - } as DataItem; - } + const description = art(path.join(__dirname, `templates/description.art`), { + heading, + subItems: items, + }); + return { + title: heading, + pubDate: parseDate(postedDate), + category: tags, + description, + link: item.link, + updated: updatedDate ? parseDate(updatedDate) : null, + author: 'Vision IAS', + } as DataItem; + } + }); } function extractArticle(articleDiv, selectorString: string = '#article-content') { diff --git a/lib/routes/visionias/weekly-focus.ts b/lib/routes/visionias/weekly-focus.ts index e87d1b896f45bd..65d55a478cffcb 100644 --- a/lib/routes/visionias/weekly-focus.ts +++ b/lib/routes/visionias/weekly-focus.ts @@ -30,21 +30,20 @@ async function handler(ctx): Promise { const response = await ofetch(`${baseUrl}/current-affairs/weekly-focus/archive`); const $ = load(response); const cards = $('div.weekly-focus-single-card').slice(0, limit).toArray(); - const individualLinks: any = []; - for (const card of cards) { - for (const item of $(card) + const individualLinks = cards.flatMap((card) => + $(card) .find('a:has(p)') - .toArray()) { + .toArray() + .map((item) => { const link = $(item).attr('href'); - individualLinks.push({ - link: link?.startsWith('http') ? link : `${baseUrl}${link}`, - }); - } - } + return { link: link?.startsWith('http') ? link : `${baseUrl}${link}` }; + }) + ); + const itemsPromise = await Promise.allSettled(individualLinks.map(({ link }) => extractNews({ link }, 'main > div > div.flex > div.flex.w-full > div.w-full.mt-6'))); return { - title: `Weekly Focus | Current Affairs | Vision IAS`, + title: 'Weekly Focus | Current Affairs | Vision IAS', link: `${baseUrl}/current-affairs/weekly-focus/archive`, description: 'Weekly Focus provides weekly comprehensive analysis of current themes with multidimensional and consolidated content.', language: 'en',