Completed Erome module. Added content URL list fetching.

This commit is contained in:
ThePendulum 2019-11-01 05:55:55 +01:00
parent 9a3561b6bc
commit 401a4e2153
5 changed files with 87 additions and 36 deletions

View File

@ -15,6 +15,8 @@ Most features are optional and can easily be disabled!
* Reddit text/self, images and videos[\*](#reddit-videos)
* Imgur (requires API key as of late 2019)
* Gfycat
* Erome
* Vidble
* Eroshare archive
### Plans and ideas

View File

@ -70,33 +70,27 @@ async function getCompletePosts() {
return attachContentInfo(curatedUserPosts);
}
async function getDirectContent(link, ep) {
const host = dissectLink(link);
const info = await getInfo(host);
async function getDirectContent(links, ep) {
return Promise.map(links, async (link) => {
const host = dissectLink(link);
const info = await getInfo(host);
console.log(info);
return fetchSaveDirectContent(info, host, ep);
}, {
concurrency: 5,
});
}
return fetchSaveDirectContent(info, host, ep);
async function getCompleteContents(ep) {
if (args.fetch) {
return getDirectContent([args.fetch], ep);
}
/*
console.log(info);
if (args.fileDirect) {
return getDirectContent(await getFileContents(args.fileDirect, 'direct'), ep);
}
await Promise.all(info.items.map(async (item, index) => {
const stream = await fetchItem(item.url);
if (info.album) {
const filepath = `./output/${host.label}/${host.id} - ${info.album.title}/${index + 1} - ${item.id}${path.extname(url.parse(item.url).pathname)}`;
console.log(filepath);
return saveItem(filepath, stream, item);
}
const filepath = `./output/${host.label}/${item.id}${path.extname(url.parse(item.url).pathname)}`;
console.log(filepath);
return saveItem(filepath, stream, item);
}));
*/
return null;
}
function fetchSavePosts(userPosts, ep) {
@ -107,15 +101,15 @@ function fetchSavePosts(userPosts, ep) {
async function initApp() {
try {
const ep = new exiftool.ExiftoolProcess(exiftoolBin);
await ep.open();
if (args.fetch) {
await getDirectContent(args.fetch, ep);
if (args.fetch || args.fileDirect) {
await getCompleteContents(ep);
return;
}
const userPosts = await getCompletePosts();
await ep.open();
await fetchSavePosts(userPosts, ep);
await ep.close();

View File

@ -29,6 +29,11 @@ function getArgs() {
type: 'string',
alias: 'fetch',
})
.option('file-direct', {
describe: 'Load direct content URLs from file',
type: 'string',
alias: 'file-fetch',
})
.option('limit', {
describe: 'Maximum amount of posts to fetch per supplied user (!), after filtering out ignored, cross- and reposts',
type: 'number',

View File

@ -42,6 +42,10 @@ const hosts = [{
method: 'gfycat',
label: 'gfycat',
pattern: new UrlPattern('http(s)\\://(:server.)gfycat.com/(gifs/detail/)(:id-mobile)(:id-size_restricted)(:id)(.:ext)(?*)'),
}, {
method: 'erome',
label: 'erome',
pattern: new UrlPattern('http(s)\\://(www.)erome.com/a/:id(?*)'),
}, {
method: 'eroshareAlbum',
label: 'eroshare',

View File

@ -1,30 +1,76 @@
'use strict';
const config = require('config');
const fetch = require('node-fetch');
const cheerio = require('cheerio');
const base = 'https://www.erome.com/';
async function erome(host) {
const res = await fetch(`${base}a/${host.id}`);
async function erome(host, post) {
const url = `${base}a/${host.id}`;
const res = await fetch(url);
if (res.ok) {
if (!res.ok) {
throw new Error(`Unable to retrieve info for Erome album '${host.id}' :(`);
}
const html = await res.text();
const $ = cheerio.load(html);
const videoUrls = $('video').toArray().map((videoEl) => {
const sourceHd = $(videoEl).find('source[label="HD"]');
const sourceSd = $(videoEl).find('source[label="SD"]');
console.log(sourceHd.attr('src'));
const title = $('meta[property="og:title"]').attr('content') || $('meta[property="twitter:title"]').attr('content');
return sourceHd ? base + sourceHd.attr('src') : base + sourceSd.attr('src');
const items = $('.media-group').toArray().map((mediaItem) => {
const mediaElement = $(mediaItem);
const videoElement = mediaElement.find('.video video');
const id = mediaElement.attr('id');
const itemTitle = mediaElement.find('h2.media-title').text();
if (videoElement.length) {
const sourceHd = videoElement.find('source[label="HD"]');
const sourceSd = videoElement.find('source[label="SD"]');
return {
id,
title: itemTitle,
url: sourceHd.length ? sourceHd.attr('src') : sourceSd.attr('src'),
type: (sourceHd.length ? sourceHd.attr('type') : sourceSd.attr('type')) || 'video/mp4',
};
}
const img = mediaElement.find('.img-front').attr('data-src');
return {
id,
title: itemTitle,
url: img,
};
});
console.log(videoUrls);
const extract = config.library.extractSingleAlbumItem && (items.length === 1);
if (extract) {
console.log('\x1b[36m%s\x1b[0m', `Extracting single item from album '${url}' (${post ? post.url : 'no post'})`);
}
return {
album: extract ? null : {
id: host.id,
url,
title,
description: null,
datetime: null,
},
items: items.map(item => ({
extracted: extract,
id: item.id,
url: item.url,
title: item.title || title || null,
description: null,
type: item.type || 'image/jpeg',
datetime: null,
})),
};
}
module.exports = erome;