Added Inn of Sinn, added Lil Sis to Nubiles.

This commit is contained in:
DebaucheryLibrarian
2023-12-06 00:15:55 +01:00
parent 655cbf50f3
commit a3c064be55
117 changed files with 558 additions and 83 deletions

100
src/scrapers/innofsin.js Executable file
View File

@@ -0,0 +1,100 @@
'use strict';
const unprint = require('unprint');
const slugify = require('../utils/slugify');
function scrapeAll(scenes) {
return scenes.map(({ query }) => {
const release = {};
release.url = query.url('a');
release.entryId = new URL(release.url).pathname.replaceAll('/', '');
release.title = query.content('h2 a');
release.date = query.date('.date', 'MMM DD, YYYY');
release.actors = query.content('.modelname').split(',').filter(Boolean);
release.poster = query.img('.imgc img');
release.teaser = query.video('.vidhover source');
console.log(release);
return release;
});
}
function scrapeScene({ query }, { url }) {
const release = {};
release.entryId = new URL(url).pathname.replaceAll('/', '');
release.title = query.content('.vid-box h1');
release.description = query.content('//div[contains(@class, "vid-box")]/*[contains(text(), "About")]/following-sibling::p[2]');
release.actors = query.all('.vid-box a[href*="/pornstars"]').map((actorEl) => ({
name: unprint.query.content(actorEl),
url: unprint.query.url(actorEl, null),
}));
release.poster = query.poster('.vid-play video');
release.photos = query.imgs('.img-sample img').map((source) => [
source.replace(/-\d+x\d+/, ''), // usually same size, but try anyway
source,
]);
release.tags = query.contents('.vid-box [itemprop="keywords"] a');
release.trailer = query.video('.vid-play source');
console.log(release);
return release;
}
function scrapeProfile({ query }, actorName, entity, include) {
const profile = {};
profile.description = query.cnt('.bio-text');
profile.birthPlace = query.cnt('.birth-place span');
profile.avatar = query.img('.actor-photo img');
if (include.releases) {
return scrapeAll(unprint.initAll(query.all('.scene')));
}
console.log(profile);
return profile;
}
async function fetchLatest(channel, page = 1) {
const url = `${channel.url}/videos/page/${page}/`;
const res = await unprint.get(url, { selectAll: '.vid-listing li' });
if (res.ok) {
return scrapeAll(res.context, channel);
}
return res.status;
}
async function fetchProfile({ name: actorName }, entity, include) {
const url = `${entity.url}/actors/${slugify(actorName, '_')}`;
const res = await unprint.get(url);
if (res.ok) {
return scrapeProfile(res.item, actorName, entity, include);
}
return res.status;
}
module.exports = {
fetchLatest,
fetchProfile,
scrapeScene: {
scraper: scrapeScene,
unprint: true,
},
};

View File

@@ -25,6 +25,7 @@ const gamma = require('./gamma');
const hitzefrei = require('./hitzefrei');
const hookuphotshot = require('./hookuphotshot');
const hush = require('./hush');
const innofsin = require('./innofsin');
const insex = require('./insex');
const inthecrack = require('./inthecrack');
const jayrock = require('./jayrock');
@@ -111,6 +112,7 @@ const scrapers = {
hookuphotshot,
hussiepass: hush,
hushpass: hush,
innofsin,
insex,
interracialpass: hush,
inthecrack,

View File

@@ -1,6 +1,7 @@
'use strict';
const qu = require('../utils/q');
const unprint = require('unprint');
const slugify = require('../utils/slugify');
function scrapeAll(scenes) {
@@ -10,11 +11,11 @@ function scrapeAll(scenes) {
release.url = query.url('.title a');
release.entryId = new URL(release.url).pathname.match(/\/scene\/(\d+)/)[1];
release.title = query.cnt('.title a');
release.description = query.cnt('.description');
release.title = query.content('.title a');
release.description = query.content('.description');
release.date = query.date('.date', 'MMM DD, YYYY');
release.actors = query.cnts('.models a.model');
release.actors = query.contents('.models a.model');
release.poster = query.img('img.poster');
release.teaser = { src: query.video('.teaser video') };
@@ -32,26 +33,26 @@ function scrapeScene({ query }, url) {
release.entryId = new URL(url).pathname.match(/\/scene\/(\d+)/)[1];
release.title = query.cnt('h3.title');
release.description = query.cnt('p.description');
release.title = query.content('h3.title');
release.description = query.content('p.description');
[release.poster, ...release.photos] = query.imgs('.preview-thumb');
release.trailer = { src: query.video('.trailer video') };
release.trailer = query.video('.trailer video');
console.log(release);
return release;
}
function scrapeProfile({ query, el }, actorName, entity, include) {
function scrapeProfile({ query }, actorName, entity, include) {
const profile = {};
profile.description = query.cnt('.bio-text');
profile.birthPlace = query.cnt('.birth-place span');
profile.description = query.content('.bio-text');
profile.birthPlace = query.content('.birth-place span');
profile.avatar = query.img('.actor-photo img');
if (include.releases) {
return scrapeAll(qu.initAll(el, '.scene'));
return scrapeAll(unprint.initAll(query.all('.scene')));
}
console.log(profile);
@@ -60,20 +61,20 @@ function scrapeProfile({ query, el }, actorName, entity, include) {
async function fetchLatest(channel, page = 1) {
const url = `${channel.url}/${page}`;
const res = await qu.getAll(url, '.scene');
const res = await unprint.get(url, { selectAll: '.scene' });
if (res.ok) {
return scrapeAll(res.items, channel);
return scrapeAll(res.context, channel);
}
return res.status;
}
async function fetchScene(url, channel) {
const res = await qu.get(url);
const res = await unprint.get(url);
if (res.ok) {
return scrapeScene(res.item, url, channel);
return scrapeScene(res.context, url, channel);
}
return res.status;
@@ -81,10 +82,10 @@ async function fetchScene(url, channel) {
async function fetchProfile({ name: actorName }, entity, include) {
const url = `${entity.url}/actors/${slugify(actorName, '_')}`;
const res = await qu.get(url);
const res = await unprint.get(url);
if (res.ok) {
return scrapeProfile(res.item, actorName, entity, include);
return scrapeProfile(res.context, actorName, entity, include);
}
return res.status;

View File

@@ -85,7 +85,7 @@ async function matchReleaseTags(releases) {
)];
const tagEntries = await knex('tags')
.select('tags.id', 'tags.name', 'tags.alias_for')
.select('tags.id', 'tags.name', 'tags.alias_for', 'tags.implied_tag_ids')
.whereIn('tags.name', casedTags);
const tagIdsBySlug = tagEntries