node-csfd-api
Version:
ČSFD API in JavaScript. Amazing NPM library for scrapping csfd.cz :)
66 lines (64 loc) • 2.85 kB
JavaScript
import { fetchPage } from "../fetchers/index.mjs";
import { userReviewsUrl } from "../vars.mjs";
import { sleep } from "../helpers/global.helper.mjs";
import { getUserReviewColorRating, getUserReviewDate, getUserReviewId, getUserReviewPoster, getUserReviewRating, getUserReviewText, getUserReviewTitle, getUserReviewType, getUserReviewUrl, getUserReviewYear } from "../helpers/user-reviews.helper.mjs";
import { parse } from "node-html-parser";
//#region src/services/user-reviews.service.ts
var UserReviewsScraper = class {
async userReviews(user, config, options) {
let allReviews = [];
const pageToFetch = config?.page || 1;
const url = userReviewsUrl(user, pageToFetch > 1 ? pageToFetch : void 0, { language: options?.language });
const items = parse(await fetchPage(url, { ...options?.request }));
const reviews = items.querySelectorAll(".user-reviews .article");
const pagesNode = items.querySelector(".pagination");
const pages = +pagesNode?.childNodes[pagesNode.childNodes.length - 4].rawText || 1;
allReviews = this.getPage(config, reviews);
if (config?.allPages) {
console.log("User", user, url);
console.log("Fetching all pages", pages);
for (let i = 2; i <= pages; i++) {
console.log("Fetching page", i, "out of", pages, "...");
const reviews$1 = parse(await fetchPage(userReviewsUrl(user, i, { language: options?.language }), { ...options?.request })).querySelectorAll(".user-reviews .article");
allReviews = [...allReviews, ...this.getPage(config, reviews$1)];
if (config.allPagesDelay) await sleep(config.allPagesDelay);
}
return allReviews;
}
return allReviews;
}
getPage(config, reviews) {
const films = [];
if (config) {
if (config.includesOnly?.length && config.excludes?.length) console.warn(`node-csfd-api:
You can not use both parameters 'includesOnly' and 'excludes'.
Parameter 'includesOnly' will be used now:`, config.includesOnly);
}
for (const el of reviews) {
const type = getUserReviewType(el);
if (config?.includesOnly?.length) {
if (config.includesOnly.some((include) => type === include)) films.push(this.buildUserReviews(el));
} else if (config?.excludes?.length) {
if (!config.excludes.some((exclude) => type === exclude)) films.push(this.buildUserReviews(el));
} else films.push(this.buildUserReviews(el));
}
return films;
}
buildUserReviews(el) {
return {
id: getUserReviewId(el),
title: getUserReviewTitle(el),
year: getUserReviewYear(el),
type: getUserReviewType(el),
url: getUserReviewUrl(el),
colorRating: getUserReviewColorRating(el),
userDate: getUserReviewDate(el),
userRating: getUserReviewRating(el),
text: getUserReviewText(el),
poster: getUserReviewPoster(el)
};
}
};
//#endregion
export { UserReviewsScraper };
//# sourceMappingURL=user-reviews.service.mjs.map