'use strict'; /* eslint-disable newline-per-chained-call */ const Promise = require('bluebird'); const moment = require('moment'); const logger = require('../logger')(__filename); const http = require('../utils/http'); const slugify = require('../utils/slugify'); const genderMap = { F: 'female', M: 'male', T: 'transsexual', // not yet observed }; function getPosterFallbacks(poster) { return poster .filter((image) => /landscape/i.test(image.name)) .sort((imageA, imageB) => imageB.height - imageA.height) .map((image) => { const sources = [image.src, image.highdpi?.['2x'], image.highdpi?.['3x']]; // high DPI images for full HD source are huge, only prefer for smaller fallback sources return image.height === 1080 ? sources : sources.reverse(); }) .flat() .map((src) => ({ src, expectType: { 'binary/octet-stream': 'image/jpeg', }, })); } function getTeaserFallbacks(teaser) { return teaser .filter((video) => /landscape/i.test(video.name)) .map((video) => ({ src: video.src, type: video.type, quality: Number(String(video.height).replace('353', '360')), })); } function getAvatarFallbacks(avatar) { return avatar .sort((imageA, imageB) => imageB.height - imageA.height) .map((image) => [image.highdpi?.['3x'], image.highdpi?.['2x'], image.src]) .flat(); } async function getTrailer(scene, channel, url) { const res = await http.post(`${channel.url}/graphql`, { operationName: 'getToken', variables: { videoId: scene.newId, device: 'trailer', }, query: ` query getToken($videoId: ID!, $device: Device!) { generateVideoToken(input: {videoId: $videoId, device: $device}) { p270 { token cdn __typename } p360 { token cdn __typename } p480 { token cdn __typename } p480l { token cdn __typename } p720 { token cdn __typename } p1080 { token cdn __typename } p2160 { token cdn __typename } hls { token cdn __typename } __typename } } `, }, { headers: { referer: url, origin: channel.url, }, }); if (res.ok && res.body.data?.generateVideoToken) { return [ { src: res.body.data.generateVideoToken.p2160?.token, quality: 2160, }, { src: res.body.data.generateVideoToken.p1080?.token, quality: 1080, }, { src: res.body.data.generateVideoToken.p720?.token, quality: 720, }, { src: res.body.data.generateVideoToken.p480?.token, quality: 480, }, { src: res.body.data.generateVideoToken.p360?.token, quality: 360, }, { src: res.body.data.generateVideoToken.p270?.token, quality: 270, }, ]; } return null; } /* async function getPhotosLegacy(url) { const htmlRes = await http.get(url, { extract: { runScripts: 'dangerously', }, }); try { const state = htmlRes?.window?.__APOLLO_STATE__; if (!state) { return []; } const key = Object.values(state?.ROOT_QUERY).find((query) => query?.__ref)?.__ref; const data = state[key]; if (!data) { return []; } return data.carousel.slice(1).map((photo) => photo.main?.[0].src).filter(Boolean); } catch (error) { logger.warn(`Failed to retrieve Vixen images: ${error.message}`); return []; } } */ async function getPhotos(url) { const htmlRes = await http.get(url, { parse: true, extract: { runScripts: 'dangerously', }, }); try { const state = htmlRes?.window?.__APOLLO_STATE__; console.log('state', state); if (!state) { return []; } const key = Object.values(state?.ROOT_QUERY).find((query) => query?.__ref)?.__ref; const data = state[key]; console.log('data', data); if (!data) { return []; } console.log(data.carousel); return data.carousel.slice(1).map((photo) => photo.main?.[0].src).filter(Boolean); } catch (error) { logger.warn(`Failed to retrieve Vixen images: ${error.message}`); return []; } } function scrapeAll(scenes, site, origin) { return scenes.map((scene) => { const release = {}; release.title = scene.title; release.entryId = String(scene.newId); release.url = `${site?.url || origin}/videos${scene.targetUrl}`; release.date = moment.utc(scene.releaseDate).toDate(); release.datePrecision = 'minute'; release.actors = scene.models; release.stars = Number(scene.textRating) / 2; release.poster = getPosterFallbacks(scene.images.poster); release.teaser = getTeaserFallbacks(scene.previews.poster); return release; }); } function scrapeUpcoming(scene, site) { if (!scene || scene.isPreReleasePeriod) return null; const release = {}; release.title = scene.targetUrl .slice(1) .split('-') .map((component) => `${component.charAt(0).toUpperCase()}${component.slice(1)}`) .join(' '); release.url = `${site.url}/videos${scene.targetUrl}`; release.date = moment.utc(scene.releaseDate).toDate(); release.datePrecision = 'minute'; release.actors = scene.models; release.poster = getPosterFallbacks(scene.images.poster); release.teaser = getTeaserFallbacks(scene.previews.poster); release.entryId = (release.poster[0] || release.teaser[0])?.src?.match(/\/(\d+)/)?.[1]; return [release]; } async function scrapeScene(data, url, site, baseRelease, options) { const scene = data.video; const release = { url, title: scene.title, description: scene.description, actors: scene.models, director: scene.directorNames, duration: scene.runLength, stars: scene.totalRateVal, tags: scene.tags, }; release.entryId = scene.newId; release.date = moment.utc(scene.releaseDate).toDate(); release.productionDate = moment.utc(scene.shootDate).toDate(); release.datePrecision = 'minute'; release.actors = baseRelease?.actors || scene.models; release.poster = getPosterFallbacks(scene.images.poster); // release.photos = data.pictureset.map(photo => photo.main[0]?.src).filter(Boolean); if (options.includePhotos) { release.photos = await getPhotos(url); } release.teaser = getTeaserFallbacks(scene.previews.poster); const trailer = await getTrailer(scene, site, url); if (trailer) release.trailer = trailer; release.chapters = data.video.chapters?.video.map((chapter) => ({ tags: [chapter.title], time: chapter.seconds, })); return release; } async function fetchActorReleases(pages, model, origin) { const releasesPerPage = await Promise.map(pages, async (page) => { const url = `${origin}/api${model.targetUrl}?page=${page}`; const res = await http.get(url); if (res.status === 200) { return scrapeAll(res.body.data.videos.videos, null, origin); } return []; }, { concurrency: 3 }); return releasesPerPage.flat(); } async function scrapeProfile(data, origin, withReleases) { const model = data.model; const profile = {}; profile.birthdate = new Date(model.dateOfBirth); profile.gender = genderMap[model.sex]; profile.hair = model.hairColour; profile.nationality = model.nationality; if (model.biography.trim().length > 0) profile.description = model.biography; if (model.cupSize && model.bustMeasurment) profile.bust = `${model.bustMeasurment}${model.cupSize}`; if (model.waistMeasurment) profile.waist = model.waistMeasurment; if (model.hipMeasurment) profile.hip = model.hipMeasurment; profile.avatar = getAvatarFallbacks(model.images.listing); profile.poster = getAvatarFallbacks(model.images.profile); profile.banner = getAvatarFallbacks(model.images.poster); const releases = scrapeAll(data.videos.videos, null, origin); if (withReleases) { const pageCount = Math.ceil(data.videos.count / 6); const otherReleases = await fetchActorReleases((Array.from({ length: pageCount - 1 }, (value, index) => index + 2)), model, origin); profile.releases = [...releases, ...otherReleases]; } else { profile.releases = releases; } return profile; } async function fetchLatest(site, page = 1) { const url = `${site.url}/api/videos?page=${page}`; const res = await http.get(url); if (res.ok) { if (res.body.data.videos) { return scrapeAll(res.body.data.videos, site); } return []; } return res.status; } async function fetchUpcoming(site) { const apiUrl = `${site.url}/api`; const res = await http.get(apiUrl); if (res.ok) { if (res.body.data.nextScene) { return scrapeUpcoming(res.body.data.nextScene, site); } return []; } return res.status; } async function fetchScene(url, site, baseRelease, options) { const { origin, pathname } = new URL(url); const apiUrl = `${origin}/api/${pathname.split('/').slice(-1)[0]}`; const res = await http.get(apiUrl, { extract: { runScripts: 'dangerously', }, }); if (res.ok) { if (res.body.data) { return scrapeScene(res.body.data, url, site, baseRelease, options); } return null; } return res.status; } async function fetchProfile({ name: actorName }, { site }, include) { const origin = site.url; const actorSlug = slugify(actorName); const url = `${origin}/api/${actorSlug}`; const res = await http.get(url); if (res.ok) { if (res.body.data) { return scrapeProfile(res.body.data, origin, include.scenes); } return null; } return res.status; } module.exports = { fetchLatest, fetchUpcoming, fetchScene, fetchProfile, };