0.0.37 • Published 1 year ago
@soralinks/news-scrapers v0.0.37
news-scrapers
Scraping news organizations' websites for headlines
Install
npm install @soralinks/news-scrapers
Use in your app
import {
NewsScraperType,
NewsScraperResponse,
NewsScraperFactory
} from '@soralinks/news-scrapers';
// Usage example: run every scraper the factory creates with
// NewsScraperType.POLITICS and print the responses of those that succeeded.
(async () => {
  const factory = new NewsScraperFactory();
  const scrapers = await factory.createScrapers();

  // allSettled (rather than all) waits for every scraper, so one rejected
  // scrape does not discard the results of the others. The async wrapper
  // turns a synchronous throw from scrape() into a rejection as well.
  const results = await Promise.allSettled(
    scrapers.map(async (scraper) => scraper.scrape(NewsScraperType.POLITICS)),
  );

  // Keep only fulfilled, truthy values. flatMap drops the rest in one typed
  // pass, so no @ts-ignore is needed to get from the settled results to
  // NewsScraperResponse[].
  const scraperResponses: NewsScraperResponse[] = results.flatMap((result) =>
    result.status === 'fulfilled' && result.value ? [result.value] : [],
  );

  console.log(`scraperResponses: ${JSON.stringify(scraperResponses, null, 2)}`);
})();
Logging
// To turn on logging, set the following environment variables:
// LOGGING_ABC_SCRAPER = 'on'
// LOGGING_AP_SCRAPER = 'on'
// LOGGING_BBC_SCRAPER = 'on'
// LOGGING_CNN_SCRAPER = 'on'
// LOGGING_DISPATCH_SCRAPER = 'on'
// LOGGING_CS_MONITOR_SCRAPER = 'on'
// LOGGING_EPOCH_TIMES_SCRAPER = 'on'
// LOGGING_FOX_SCRAPER = 'on'
// LOGGING_NEWSNATION_SCRAPER = 'on'
// LOGGING_NEWSWEEK_SCRAPER = 'on'
// LOGGING_NY_POST_SCRAPER = 'on'
// LOGGING_WASH_EXAM_SCRAPER = 'on'
// LOGGING_WSJ_SCRAPER = 'on'
// Note that error logging is always on
0.0.37
1 year ago
0.0.36
1 year ago
0.0.32
1 year ago
0.0.33
1 year ago
0.0.34
1 year ago
0.0.35
1 year ago
0.0.31
1 year ago
0.0.30
1 year ago
0.0.29
1 year ago
0.0.28
2 years ago
0.0.24
2 years ago
0.0.25
2 years ago
0.0.26
2 years ago
0.0.27
2 years ago
0.0.22
2 years ago
0.0.23
2 years ago
0.0.20
2 years ago
0.0.21
2 years ago
0.0.19
2 years ago
0.0.18
2 years ago
0.0.17
2 years ago
0.0.16
2 years ago
0.0.15
2 years ago
0.0.14
2 years ago
0.0.13
2 years ago
0.0.12
2 years ago
0.0.11
2 years ago
0.0.10
2 years ago
0.0.9
2 years ago
0.0.8
2 years ago
0.0.7
2 years ago
0.0.6
2 years ago
0.0.5
2 years ago
0.0.4
2 years ago
0.0.3
2 years ago
0.0.2
2 years ago
0.0.1
2 years ago