Added Blowpass scraper. Split shootId and pageId.

This commit is contained in:
2019-04-06 23:24:26 +02:00
parent 069c2c1628
commit 3a90f98d41
14 changed files with 208 additions and 11 deletions

View File

@@ -25,13 +25,14 @@ function scrapeLatest(html, site) {
const originalTitle = sceneLinkElement.text().trim(); // title attribute breaks when they use \\ escaping
const { shootId, title } = extractTitle(originalTitle);
const internalId = new URL(url).pathname.split('/')[2];
const entryId = new URL(url).pathname.split('/')[2];
const date = moment.utc($(element).attr('release'), 'YYYY/MM/DD').toDate();
return {
url,
shootId: shootId || internalId,
shootId,
entryId,
title,
date,
site,
@@ -44,6 +45,7 @@ async function scrapeScene(html, url, site) {
const originalTitle = $('h1.watchpage-title').text().trim();
const { shootId, title } = extractTitle(originalTitle);
const entryId = new URL(url).pathname.split('/')[2];
const date = moment.utc($('span[title="Release date"] a').text(), 'YYYY-MM-DD').toDate();
@@ -60,6 +62,7 @@ async function scrapeScene(html, url, site) {
return {
url,
shootId,
entryId,
title,
date,
actors,