'use strict'; const unprint = require('unprint'); const slugify = require('../utils/slugify'); const { convert } = require('../utils/convert'); const tryUrls = require('../utils/try-urls'); function scrapeAll(scenes, channel) { return scenes.map(({ query }) => { const release = {}; release.url = query.url('a'); release.entryId = slugify(new URL(release.url).pathname.match(/trailers\/(.*)/)[1]); release.title = query.content('h2 a'); release.actors = query.all('a[href*="models/"], a[href*="sets.php"]').map((actorEl) => ({ name: unprint.query.content(actorEl), url: unprint.query.url(actorEl, null, { origin: channel.url }), })); release.poster = query.img('.thumbnail img'); release.teaser = query.video('.thumbnail img', { attribute: 'data-vid' }); // not a mistake, video source is on img tag return release; }); } async function fetchLatest(channel, page = 1) { const url = `${channel.url}/porn-categories/movies/?sort=most-recent&page=${page}`; const res = await unprint.get(url, { selectAll: '.content div[data-setid]' }); if (res.ok) { return scrapeAll(res.context, channel); } return res.status; } function scrapeScene({ query }, { url }) { const release = {}; release.entryId = slugify(new URL(url).pathname.match(/trailers\/(.*)/)[1]); release.title = query.content('h1.title_bar'); release.description = query.content('.description-text'); release.date = query.date('//label[contains(text(), \'Date\')]/following-sibling::p[1]', 'YYYY-MM-DD'); release.actors = query.all('.text a[href*="/models"]').map((actorEl) => ({ name: unprint.query.content(actorEl), url: unprint.query.url(actorEl, null), })); release.tags = query.contents('.text a[href*="categories/"]'); release.poster = query.poster('#preview video'); release.trailer = query.video('#preview video source'); return release; } function scrapeProfile({ query }, { url }) { const profile = { url }; const bio = Object.fromEntries(query.all('.model-details > div').map((bioEl) => [ slugify(unprint.query.content(bioEl, 'h2'), '_'), unprint.query.text(bioEl), ])); profile.avatar = [ query.img('.model_bio_thumb', { attribute: 'src0_3x' }), query.img('.model_bio_thumb', { attribute: 'src0_2x' }), query.img('.model_bio_thumb', { attribute: 'src0_1x' }), ]; profile.description = [query.content('.model-bio-text'), bio.funfact].filter(Boolean).join(' '); profile.aliases = bio.alias?.split(/[,\n]/).map((alias) => alias.trim()); profile.age = parseInt(bio.age, 10) || null; profile.dateOfBirth = unprint.extractDate(bio.age, 'MM/DD/YYYY'); profile.measurements = bio.measurements; profile.height = Number(bio.height.match(/(\d+)\s*cm/)?.[1]) || convert(bio.height, 'cm'); return profile; } async function fetchProfile({ name: actorName, url: actorUrl }, { entity, include }) { const { res, url } = await tryUrls([ actorUrl, `${entity.url}/models/${slugify(actorName, '')}.html`, `${entity.url}/models/${slugify(actorName, '-')}.html`, ]); if (res.ok) { return scrapeProfile(res.context, { entity, include, url }); } return res.status; } module.exports = { fetchLatest, fetchProfile, scrapeScene, };