X-Git-Url: https://git.immae.eu/?a=blobdiff_plain;f=server%2Ftools%2Fpeertube-import-videos.ts;h=bbdaa09c0b40dce14026a85cd704bd32538be48c;hb=2c015b54192f2080f756c424173bac2bd53e7ca9;hp=fcb90cca3f30af56493c1cc211d47eca62d23b7a;hpb=8d5e65349deebd499c0be10fe02d535a77d58ddb;p=github%2FChocobozzz%2FPeerTube.git diff --git a/server/tools/peertube-import-videos.ts b/server/tools/peertube-import-videos.ts index fcb90cca3..bbdaa09c0 100644 --- a/server/tools/peertube-import-videos.ts +++ b/server/tools/peertube-import-videos.ts @@ -1,23 +1,21 @@ -// FIXME: https://github.com/nodejs/node/pull/16853 -require('tls').DEFAULT_ECDH_CURVE = 'auto' - -import * as program from 'commander' -import { join } from 'path' -import { doRequestAndSaveToFile } from '../helpers/requests' -import { CONSTRAINTS_FIELDS } from '../initializers/constants' -import { getClient, getVideoCategories, login, searchVideoWithSort, uploadVideo } from '../../shared/extra-utils/index' -import { truncate } from 'lodash' -import * as prompt from 'prompt' +import { program } from 'commander' import { accessSync, constants } from 'fs' import { remove } from 'fs-extra' -import { sha256 } from '../helpers/core-utils' -import { buildOriginallyPublishedAt, safeGetYoutubeDL } from '../helpers/youtube-dl' -import { buildCommonVideoOptions, buildVideoAttributesFromCommander, getServerCredentials, getLogger } from './cli' +import { join } from 'path' +import { YoutubeDLCLI, YoutubeDLInfo, YoutubeDLInfoBuilder } from '@server/helpers/youtube-dl' +import { wait } from '@shared/core-utils' +import { sha256 } from '@shared/extra-utils' +import { doRequestAndSaveToFile } from '../helpers/requests' +import { + assignToken, + buildCommonVideoOptions, + buildServer, + buildVideoAttributesFromCommander, + getLogger, + getServerCredentials +} from './shared' -type UserInfo = { - username: string - password: string -} +import prompt = require('prompt') const processOptions = { maxBuffer: Infinity @@ -37,208 +35,211 @@ command .option('--until ', 'Publication date (inclusive) until which the videos can be imported (YYYY-MM-DD)', parseDate) .option('--first ', 'Process first n elements of returned playlist') .option('--last ', 'Process last n elements of returned playlist') + .option('--wait-interval ', 'Duration between two video imports (in seconds)', convertIntoMs) .option('-T, --tmpdir ', 'Working directory', __dirname) + .usage('[global options] [ -- youtube-dl options]') .parse(process.argv) -let log = getLogger(program[ 'verbose' ]) +const options = command.opts() + +const log = getLogger(options.verbose) getServerCredentials(command) .then(({ url, username, password }) => { - if (!program[ 'targetUrl' ]) { + if (!options.targetUrl) { exitError('--target-url field is required.') } try { - accessSync(program[ 'tmpdir' ], constants.R_OK | constants.W_OK) + accessSync(options.tmpdir, constants.R_OK | constants.W_OK) } catch (e) { - exitError('--tmpdir %s: directory does not exist or is not accessible', program[ 'tmpdir' ]) + exitError('--tmpdir %s: directory does not exist or is not accessible', options.tmpdir) } - removeEndSlashes(url) - removeEndSlashes(program[ 'targetUrl' ]) - - const user = { username, password } + url = normalizeTargetUrl(url) + options.targetUrl = normalizeTargetUrl(options.targetUrl) - run(url, user) - .catch(err => { - exitError(err) - }) + run(url, username, password) + .catch(err => exitError(err)) }) + .catch(err => console.error(err)) -async function run (url: string, user: UserInfo) { - if (!user.password) { - user.password = await promptPassword() - } +async function run (url: string, username: string, password: string) { + if (!password) password = await promptPassword() - const youtubeDL = await safeGetYoutubeDL() + const youtubeDLBinary = await YoutubeDLCLI.safeGet() - const options = [ '-j', '--flat-playlist', '--playlist-reverse' ] - youtubeDL.getInfo(program[ 'targetUrl' ], options, processOptions, async (err, info) => { - if (err) { - exitError(err.message) - } + let info = await getYoutubeDLInfo(youtubeDLBinary, options.targetUrl, command.args) - let infoArray: any[] + if (!Array.isArray(info)) info = [ info ] - // Normalize utf8 fields - infoArray = [].concat(info); - if (program[ 'first' ]) { - infoArray = infoArray.slice(0, program[ 'first' ]) - } else if (program[ 'last' ]) { - infoArray = infoArray.slice(- program[ 'last' ]) - } - infoArray = infoArray.map(i => normalizeObject(i)) + // Try to fix youtube channels upload + const uploadsObject = info.find(i => !i.ie_key && !i.duration && i.title === 'Uploads') + + if (uploadsObject) { + console.log('Fixing URL to %s.', uploadsObject.url) + + info = await getYoutubeDLInfo(youtubeDLBinary, uploadsObject.url, command.args) + } + + let infoArray: any[] - log.info('Will download and upload %d videos.\n', infoArray.length) + infoArray = [].concat(info) + if (options.first) { + infoArray = infoArray.slice(0, options.first) + } else if (options.last) { + infoArray = infoArray.slice(-options.last) + } + + log.info('Will download and upload %d videos.\n', infoArray.length) + + let skipInterval = true + for (const [ index, info ] of infoArray.entries()) { + try { + if (index > 0 && options.waitInterval && !skipInterval) { + log.info('Wait for %d seconds before continuing.', options.waitInterval / 1000) + await wait(options.waitInterval) + } - for (const info of infoArray) { - await processVideo({ - cwd: program[ 'tmpdir' ], + skipInterval = await processVideo({ + cwd: options.tmpdir, url, - user, + username, + password, youtubeInfo: info }) + } catch (err) { + console.error('Cannot process video.', { info, url, err }) } + } - log.info('Video/s for user %s imported: %s', user.username, program[ 'targetUrl' ]) - process.exit(0) - }) + log.info('Video/s for user %s imported: %s', username, options.targetUrl) + process.exit(0) } -function processVideo (parameters: { - cwd: string, - url: string, - user: { username: string, password: string }, +async function processVideo (parameters: { + cwd: string + url: string + username: string + password: string youtubeInfo: any }) { - const { youtubeInfo, cwd, url, user } = parameters + const { youtubeInfo, cwd, url, username, password } = parameters - return new Promise(async res => { - log.debug('Fetching object.', youtubeInfo) + log.debug('Fetching object.', youtubeInfo) - const videoInfo = await fetchObject(youtubeInfo) - log.debug('Fetched object.', videoInfo) + const videoInfo = await fetchObject(youtubeInfo) + log.debug('Fetched object.', videoInfo) - if (program[ 'since' ]) { - if (buildOriginallyPublishedAt(videoInfo).getTime() < program[ 'since' ].getTime()) { - log.info('Video "%s" has been published before "%s", don\'t upload it.\n', - videoInfo.title, formatDate(program[ 'since' ])); - return res(); - } - } - if (program[ 'until' ]) { - if (buildOriginallyPublishedAt(videoInfo).getTime() > program[ 'until' ].getTime()) { - log.info('Video "%s" has been published after "%s", don\'t upload it.\n', - videoInfo.title, formatDate(program[ 'until' ])); - return res(); - } + if ( + options.since && + videoInfo.originallyPublishedAtWithoutTime && + videoInfo.originallyPublishedAtWithoutTime.getTime() < options.since.getTime() + ) { + log.info('Video "%s" has been published before "%s", don\'t upload it.\n', videoInfo.name, formatDate(options.since)) + return true + } + + if ( + options.until && + videoInfo.originallyPublishedAtWithoutTime && + videoInfo.originallyPublishedAtWithoutTime.getTime() > options.until.getTime() + ) { + log.info('Video "%s" has been published after "%s", don\'t upload it.\n', videoInfo.name, formatDate(options.until)) + return true + } + + const server = buildServer(url) + const { data } = await server.search.advancedVideoSearch({ + search: { + search: videoInfo.name, + sort: '-match', + searchTarget: 'local' } + }) - const result = await searchVideoWithSort(url, videoInfo.title, '-match') + log.info('############################################################\n') - log.info('############################################################\n') + if (data.find(v => v.name === videoInfo.name)) { + log.info('Video "%s" already exists, don\'t reupload it.\n', videoInfo.name) + return true + } - if (result.body.data.find(v => v.name === videoInfo.title)) { - log.info('Video "%s" already exists, don\'t reupload it.\n', videoInfo.title) - return res() - } + const path = join(cwd, sha256(videoInfo.url) + '.mp4') - const path = join(cwd, sha256(videoInfo.url) + '.mp4') + log.info('Downloading video "%s"...', videoInfo.name) - log.info('Downloading video "%s"...', videoInfo.title) + try { + const youtubeDLBinary = await YoutubeDLCLI.safeGet() + const output = await youtubeDLBinary.download({ + url: videoInfo.url, + format: YoutubeDLCLI.getYoutubeDLVideoFormat([], false), + output: path, + additionalYoutubeDLArgs: command.args, + processOptions + }) - const options = [ '-f', 'bestvideo[ext=mp4]+bestaudio[ext=m4a]/best', '-o', path ] - try { - const youtubeDL = await safeGetYoutubeDL() - youtubeDL.exec(videoInfo.url, options, processOptions, async (err, output) => { - if (err) { - log.error(err) - return res() - } + log.info(output.join('\n')) + await uploadVideoOnPeerTube({ + cwd, + url, + username, + password, + videoInfo, + videoPath: path + }) + } catch (err) { + log.error(err.message) + } - log.info(output.join('\n')) - await uploadVideoOnPeerTube({ - cwd, - url, - user, - videoInfo: normalizeObject(videoInfo), - videoPath: path - }) - return res() - }) - } catch (err) { - log.error(err.message) - return res() - } - }) + return false } async function uploadVideoOnPeerTube (parameters: { - videoInfo: any, - videoPath: string, - cwd: string, - url: string, - user: { username: string; password: string } + videoInfo: YoutubeDLInfo + videoPath: string + cwd: string + url: string + username: string + password: string }) { - const { videoInfo, videoPath, cwd, url, user } = parameters - - const category = await getCategory(videoInfo.categories, url) - const licence = getLicence(videoInfo.license) - let tags = [] - if (Array.isArray(videoInfo.tags)) { - tags = videoInfo.tags - .filter(t => t.length < CONSTRAINTS_FIELDS.VIDEOS.TAG.max && t.length > CONSTRAINTS_FIELDS.VIDEOS.TAG.min) - .map(t => t.normalize()) - .slice(0, 5) - } + const { videoInfo, videoPath, cwd, url, username, password } = parameters - let thumbnailfile - if (videoInfo.thumbnail) { - thumbnailfile = join(cwd, sha256(videoInfo.thumbnail) + '.jpg') + const server = buildServer(url) + await assignToken(server, username, password) - await doRequestAndSaveToFile({ - method: 'GET', - uri: videoInfo.thumbnail - }, thumbnailfile) - } + let thumbnailfile: string + if (videoInfo.thumbnailUrl) { + thumbnailfile = join(cwd, sha256(videoInfo.thumbnailUrl) + '.jpg') - const originallyPublishedAt = buildOriginallyPublishedAt(videoInfo) - - const defaultAttributes = { - name: truncate(videoInfo.title, { - 'length': CONSTRAINTS_FIELDS.VIDEOS.NAME.max, - 'separator': /,? +/, - 'omission': ' […]' - }), - category, - licence, - nsfw: isNSFW(videoInfo), - description: videoInfo.description, - tags + await doRequestAndSaveToFile(videoInfo.thumbnailUrl, thumbnailfile) } - const videoAttributes = await buildVideoAttributesFromCommander(url, program, defaultAttributes) + const baseAttributes = await buildVideoAttributesFromCommander(server, program, videoInfo) + + const attributes = { + ...baseAttributes, + + originallyPublishedAtWithoutTime: videoInfo.originallyPublishedAtWithoutTime + ? videoInfo.originallyPublishedAtWithoutTime.toISOString() + : null, - Object.assign(videoAttributes, { - originallyPublishedAt: originallyPublishedAt ? originallyPublishedAt.toISOString() : null, thumbnailfile, previewfile: thumbnailfile, fixture: videoPath - }) - - log.info('\nUploading on PeerTube video "%s".', videoAttributes.name) + } - let accessToken = await getAccessTokenOrDie(url, user) + log.info('\nUploading on PeerTube video "%s".', attributes.name) try { - await uploadVideo(url, accessToken, videoAttributes) + await server.videos.upload({ attributes }) } catch (err) { if (err.message.indexOf('401') !== -1) { log.info('Got 401 Unauthorized, token may have expired, renewing token and retry.') - accessToken = await getAccessTokenOrDie(url, user) + server.accessToken = await server.login.getAccessToken(username, password) - await uploadVideo(url, accessToken, videoAttributes) + await server.videos.upload({ attributes }) } else { exitError(err.message) } @@ -247,89 +248,47 @@ async function uploadVideoOnPeerTube (parameters: { await remove(videoPath) if (thumbnailfile) await remove(thumbnailfile) - log.warn('Uploaded video "%s"!\n', videoAttributes.name) + log.info('Uploaded video "%s"!\n', attributes.name) } /* ---------------------------------------------------------- */ -async function getCategory (categories: string[], url: string) { - if (!categories) return undefined - - const categoryString = categories[ 0 ] - - if (categoryString === 'News & Politics') return 11 - - const res = await getVideoCategories(url) - const categoriesServer = res.body - - for (const key of Object.keys(categoriesServer)) { - const categoryServer = categoriesServer[ key ] - if (categoryString.toLowerCase() === categoryServer.toLowerCase()) return parseInt(key, 10) - } - - return undefined -} - -function getLicence (licence: string) { - if (!licence) return undefined - - if (licence.indexOf('Creative Commons Attribution licence') !== -1) return 1 - - return undefined -} - -function normalizeObject (obj: any) { - const newObj: any = {} - - for (const key of Object.keys(obj)) { - // Deprecated key - if (key === 'resolution') continue - - const value = obj[ key ] - - if (typeof value === 'string') { - newObj[ key ] = value.normalize() - } else { - newObj[ key ] = value - } - } +async function fetchObject (info: any) { + const url = buildUrl(info) - return newObj -} + const youtubeDLCLI = await YoutubeDLCLI.safeGet() + const result = await youtubeDLCLI.getInfo({ + url, + format: YoutubeDLCLI.getYoutubeDLVideoFormat([], false), + processOptions + }) -function fetchObject (info: any) { - const url = buildUrl(info) + const builder = new YoutubeDLInfoBuilder(result) - return new Promise(async (res, rej) => { - const youtubeDL = await safeGetYoutubeDL() - youtubeDL.getInfo(url, undefined, processOptions, async (err, videoInfo) => { - if (err) return rej(err) + const videoInfo = builder.getInfo() - const videoInfoWithUrl = Object.assign(videoInfo, { url }) - return res(normalizeObject(videoInfoWithUrl)) - }) - }) + return { ...videoInfo, url } } function buildUrl (info: any) { const webpageUrl = info.webpage_url as string - if (webpageUrl && webpageUrl.match(/^https?:\/\//)) return webpageUrl + if (webpageUrl?.match(/^https?:\/\//)) return webpageUrl const url = info.url as string - if (url && url.match(/^https?:\/\//)) return url + if (url?.match(/^https?:\/\//)) return url // It seems youtube-dl does not return the video url return 'https://www.youtube.com/watch?v=' + info.id } -function isNSFW (info: any) { - return info.age_limit && info.age_limit >= 16 -} +function normalizeTargetUrl (url: string) { + let normalizedUrl = url.replace(/\/+$/, '') -function removeEndSlashes (url: string) { - while (url.endsWith('/')) { - url.slice(0, -1) + if (!normalizedUrl.startsWith('http://') && !normalizedUrl.startsWith('https://')) { + normalizedUrl = 'https://' + normalizedUrl } + + return normalizedUrl } async function promptPassword () { @@ -352,38 +311,41 @@ async function promptPassword () { }) } -async function getAccessTokenOrDie (url: string, user: UserInfo) { - const resClient = await getClient(url) - const client = { - id: resClient.body.client_id, - secret: resClient.body.client_secret - } - - try { - const res = await login(url, client, user) - return res.body.access_token - } catch (err) { - exitError('Cannot authenticate. Please check your username/password.') - } -} - function parseDate (dateAsStr: string): Date { if (!/\d{4}-\d{2}-\d{2}/.test(dateAsStr)) { - exitError(`Invalid date passed: ${dateAsStr}. Expected format: YYYY-MM-DD. See help for usage.`); + exitError(`Invalid date passed: ${dateAsStr}. Expected format: YYYY-MM-DD. See help for usage.`) } - const date = new Date(dateAsStr); + const date = new Date(dateAsStr) + date.setHours(0, 0, 0) if (isNaN(date.getTime())) { - exitError(`Invalid date passed: ${dateAsStr}. See help for usage.`); + exitError(`Invalid date passed: ${dateAsStr}. See help for usage.`) } - return date; + return date } function formatDate (date: Date): string { - return date.toISOString().split('T')[0]; + return date.toISOString().split('T')[0] } -function exitError (message:string, ...meta: any[]) { +function convertIntoMs (secondsAsStr: string): number { + const seconds = parseInt(secondsAsStr, 10) + if (seconds <= 0) { + exitError(`Invalid duration passed: ${seconds}. Expected duration to be strictly positive and in seconds`) + } + return Math.round(seconds * 1000) +} + +function exitError (message: string, ...meta: any[]) { // use console.error instead of log.error here console.error(message, ...meta) process.exit(-1) } + +function getYoutubeDLInfo (youtubeDLCLI: YoutubeDLCLI, url: string, args: string[]) { + return youtubeDLCLI.getInfo({ + url, + format: YoutubeDLCLI.getYoutubeDLVideoFormat([], false), + additionalYoutubeDLArgs: [ '-j', '--flat-playlist', '--playlist-reverse', ...args ], + processOptions + }) +}