]> git.immae.eu Git - github/Chocobozzz/PeerTube.git/blame - server/helpers/ffmpeg-utils.ts
Add tests for video downscale framerate matching
[github/Chocobozzz/PeerTube.git] / server / helpers / ffmpeg-utils.ts
CommitLineData
14d3270f 1import * as ffmpeg from 'fluent-ffmpeg'
09209296 2import { dirname, join } from 'path'
5ba49f26 3import { getTargetBitrate, getMaxBitrate, VideoResolution } from '../../shared/models/videos'
6dd9de95 4import { FFMPEG_NICE, VIDEO_TRANSCODING_FPS } from '../initializers/constants'
26670720 5import { processImage } from './image-utils'
6fdc553a 6import { logger } from './logger'
e5565833 7import { checkFFmpegEncoders } from '../initializers/checker-before-init'
6dd9de95
C
8import { readFile, remove, writeFile } from 'fs-extra'
9import { CONFIG } from '../initializers/config'
14d3270f 10
06215f15
C
/**
 * Lists the resolutions a video should be transcoded to.
 *
 * A resolution is kept when it is enabled in `CONFIG.TRANSCODING.RESOLUTIONS`
 * (looked up under the key `<resolution>p`) and is strictly lower than the
 * height of the source video.
 *
 * @param videoFileHeight height of the source video
 * @returns the kept resolutions, in the order the jobs should be processed
 */
function computeResolutionsToTranscode (videoFileHeight: number) {
  const enabledByConfig = CONFIG.TRANSCODING.RESOLUTIONS

  // The order of this list is the order in which we want to proceed jobs
  const candidates: number[] = [
    VideoResolution.H_NOVIDEO,
    VideoResolution.H_480P,
    VideoResolution.H_360P,
    VideoResolution.H_720P,
    VideoResolution.H_240P,
    VideoResolution.H_1080P,
    VideoResolution.H_4K
  ]

  return candidates.filter(candidate => {
    return enabledByConfig[ candidate + 'p' ] === true && videoFileHeight > candidate
  })
}
34
/**
 * Probes the file and returns the dimensions of its video stream.
 *
 * @param path path of the media file to probe
 * @returns `{ width, height }` of the video stream, or zeros when the file has no video stream
 */
async function getVideoStreamSize (path: string) {
  const stream = await getVideoStreamFromFile(path)

  if (stream === null) return { width: 0, height: 0 }

  return { width: stream.width, height: stream.height }
}
42
52201311
C
/**
 * Builds the codec string of the video stream (e.g. `avc1.64001f`):
 * `<codec tag>.<profile + constraint bytes><level>`.
 *
 * @param path path of the media file to probe
 * @returns the codec string, or an empty string when the file has no video stream
 */
async function getVideoStreamCodec (path: string) {
  const videoStream = await getVideoStreamFromFile(path)

  if (!videoStream) return ''

  const videoCodec = videoStream.codec_tag_string

  // Hexadecimal profile + constraint bytes for the profile names we know about
  const baseProfileMatrix = {
    'High': '6400',
    'Main': '4D40',
    'Baseline': '42E0'
  }

  let baseProfile = baseProfileMatrix[videoStream.profile]
  if (!baseProfile) {
    logger.warn('Cannot get video profile codec of %s.', path, { videoStream })
    baseProfile = baseProfileMatrix['High'] // Fallback
  }

  // The level is a single byte in the codec string, so it must always be
  // written with two hexadecimal digits (level 10 is "0a", not "a")
  let level = videoStream.level.toString(16)
  if (level.length === 1) level = `0${level}`

  return `${videoCodec}.${baseProfile}${level}`
}
66
/**
 * Returns the codec string of the audio stream.
 *
 * Only AAC is recognised; any other codec logs a warning and falls back to
 * the same AAC codec string.
 *
 * @param path path of the media file to probe
 * @returns `'mp4a.40.2'`, or an empty string when the file has no audio stream
 */
async function getAudioStreamCodec (path: string) {
  const probed = await audio.get(path)
  const audioStream = probed.audioStream

  if (!audioStream) return ''

  if (audioStream.codec_name !== 'aac') {
    logger.warn('Cannot get audio codec of %s.', path, { audioStream })
  }

  // Exact value for AAC, fallback for everything else
  return 'mp4a.40.2'
}
79
/**
 * Computes the resolution of a video file and whether it is in portrait mode.
 *
 * @param path path of the media file to probe
 * @returns `videoFileResolution` (the smaller of width and height) and
 *          `isPortraitMode` (true when the video is taller than wide)
 */
async function getVideoFileResolution (path: string) {
  const { width, height } = await getVideoStreamSize(path)

  const videoFileResolution = Math.min(height, width)
  const isPortraitMode = height > width

  return { videoFileResolution, isPortraitMode }
}
14d3270f 88
/**
 * Reads the framerate of the video stream.
 *
 * `avg_frame_rate` is tried first, then `r_frame_rate`; both are expected
 * to be fractions written as `<frames>/<seconds>`.
 *
 * @param path path of the media file to probe
 * @returns the rounded framerate, or 0 when there is no video stream or no usable value
 */
async function getVideoFileFPS (path: string) {
  const stream = await getVideoStreamFromFile(path)
  if (stream === null) return 0

  const fractions: string[] = [ stream[ 'avg_frame_rate' ], stream[ 'r_frame_rate' ] ]

  for (const fraction of fractions) {
    if (!fraction) continue

    const parts = fraction.split('/')
    const numerator = parts[0]
    const denominator = parts[1]
    if (!numerator || !denominator) continue

    const framerate = parseInt(numerator, 10) / parseInt(denominator, 10)
    // "0/0" gives NaN, which fails this check so the next key is tried
    if (framerate > 0) return Math.round(framerate)
  }

  return 0
}
106
edb4ffc7
FA
/**
 * Reads the overall bitrate reported by ffprobe for the file container.
 *
 * @param path path of the media file to probe
 * @returns the `format.bit_rate` value; rejects with the ffprobe error on failure
 */
async function getVideoFileBitrate (path: string) {
  return new Promise<number>((resolve, reject) => {
    ffmpeg.ffprobe(path, (probeError, metadata) => {
      if (probeError) {
        reject(probeError)
        return
      }

      resolve(metadata.format.bit_rate)
    })
  })
}
116
14d3270f
C
/**
 * Reads the duration reported by ffprobe for the file container.
 *
 * @param path path of the media file to probe
 * @returns the `format.duration` value rounded down; rejects with the ffprobe error on failure
 */
function getDurationFromVideoFile (path: string) {
  return new Promise<number>((resolve, reject) => {
    ffmpeg.ffprobe(path, (probeError, metadata) => {
      if (probeError) {
        reject(probeError)
        return
      }

      resolve(Math.floor(metadata.format.duration))
    })
  })
}
126
26670720
C
/**
 * Extracts one thumbnail from a video and hands it to `processImage`.
 *
 * ffmpeg first writes a temporary `pending-<imageName>` file in `folder`,
 * which `processImage` then turns into the final `<folder>/<imageName>`.
 *
 * Failures are logged, not thrown: on error the pending file is removed
 * (best effort) and the returned promise still resolves.
 *
 * @param fromPath path of the source video
 * @param folder directory receiving both the pending and the final image
 * @param imageName file name of the final image
 * @param size dimensions forwarded to `processImage`
 */
async function generateImageFromVideoFile (fromPath: string, folder: string, imageName: string, size: { width: number, height: number }) {
  const pendingImageName = 'pending-' + imageName
  const pendingImagePath = join(folder, pendingImageName)

  const thumbnailOptions = {
    filename: pendingImageName,
    count: 1,
    folder
  }

  const takeThumbnail = () => new Promise<string>((resolve, reject) => {
    ffmpeg(fromPath, { niceness: FFMPEG_NICE.THUMBNAIL })
      .on('error', reject)
      .on('end', () => resolve(imageName))
      .thumbnail(thumbnailOptions)
  })

  try {
    await takeThumbnail()

    await processImage(pendingImagePath, join(folder, imageName), size)
  } catch (err) {
    logger.error('Cannot generate image from video %s.', fromPath, { err })

    // Do not leave the temporary file behind
    try {
      await remove(pendingImagePath)
    } catch (removeErr) {
      logger.debug('Cannot remove pending image path after generation error.', { err: removeErr })
    }
  }
}
158
/** Discriminator values selecting which ffmpeg command `transcode` builds. */
type TranscodeOptionsType = 'hls' | 'quick-transcode' | 'video' | 'merge-audio' | 'only-audio'

/** Fields shared by every kind of transcoding job. */
interface BaseTranscodeOptions {
  type: TranscodeOptionsType

  inputPath: string
  outputPath: string

  resolution: VideoResolution
  isPortraitMode?: boolean
}

/** HLS output: either copies the codecs or re-encodes, then writes a playlist. */
interface HLSTranscodeOptions extends BaseTranscodeOptions {
  type: 'hls'

  copyCodecs: boolean

  hlsPlaylist: {
    // Name of the video file the playlist refers to
    videoFilename: string
  }
}

/** Stream copy, without re-encoding. */
interface QuickTranscodeOptions extends BaseTranscodeOptions {
  type: 'quick-transcode'
}

/** Regular x264 re-encoding. */
interface VideoTranscodeOptions extends BaseTranscodeOptions {
  type: 'video'
}

/** Builds a video from the input and the audio file at `audioPath`. */
interface MergeAudioTranscodeOptions extends BaseTranscodeOptions {
  type: 'merge-audio'

  audioPath: string
}

/** Keeps the audio only. */
interface OnlyAudioTranscodeOptions extends BaseTranscodeOptions {
  type: 'only-audio'
}

/** Any job description accepted by `transcode`, discriminated by `type`. */
type TranscodeOptions =
  HLSTranscodeOptions |
  VideoTranscodeOptions |
  MergeAudioTranscodeOptions |
  OnlyAudioTranscodeOptions |
  QuickTranscodeOptions
536598cf 199
/**
 * Runs an ffmpeg transcoding job.
 *
 * The command is built according to `options.type` (any type without a
 * dedicated builder goes through the x264 builder). Once ffmpeg ends, the
 * HLS playlist is fixed if needed before the promise resolves.
 *
 * @param options description of the job
 * @returns a promise resolved when the job is done, and rejected when the
 *          command cannot be built, ffmpeg fails or the playlist fix fails
 */
function transcode (options: TranscodeOptions) {
  return new Promise<void>(async (resolve, reject) => {
    try {
      let command = ffmpeg(options.inputPath, { niceness: FFMPEG_NICE.TRANSCODING })
        .output(options.outputPath)

      switch (options.type) {
        case 'quick-transcode':
          command = await buildQuickTranscodeCommand(command)
          break

        case 'hls':
          command = await buildHLSCommand(command, options)
          break

        case 'merge-audio':
          command = await buildAudioMergeCommand(command, options)
          break

        case 'only-audio':
          command = await buildOnlyAudioCommand(command, options)
          break

        default:
          command = await buildx264Command(command, options)
      }

      // if we don't set any threads ffmpeg will chose automatically
      if (CONFIG.TRANSCODING.THREADS > 0) {
        command = command.outputOption('-threads ' + CONFIG.TRANSCODING.THREADS)
      }

      command.on('error', (err, stdout, stderr) => {
        logger.error('Error in transcoding job.', { stdout, stderr })
        reject(err)
      })

      command.on('end', () => {
        fixHLSPlaylistIfNeeded(options)
          .then(() => resolve())
          .catch(reject)
      })

      command.run()
    } catch (err) {
      reject(err)
    }
  })
}
239
/**
 * Tells whether a file can be "quick transcoded" (streams copied as is).
 *
 * The video stream must be h264 / yuv420p, with a framerate inside the
 * `VIDEO_TRANSCODING_FPS` MIN/MAX bounds and a bitrate not above
 * `getMaxBitrate` for its resolution. The audio stream, when there is one,
 * must be AAC and must not exceed the ceiling returned by `audio.bitrate.aac`.
 *
 * @param path path of the media file to probe
 */
async function canDoQuickTranscode (path: string): Promise<boolean> {
  // NOTE: This could be optimized by running ffprobe only once (but it runs fast anyway)
  const videoStream = await getVideoStreamFromFile(path)
  const parsedAudio = await audio.get(path)
  const fps = await getVideoFileFPS(path)
  const bitRate = await getVideoFileBitrate(path)
  const resolution = await getVideoFileResolution(path)

  // check video params
  if (videoStream == null) return false

  const wrongVideoFormat = videoStream[ 'codec_name' ] !== 'h264' || videoStream[ 'pix_fmt' ] !== 'yuv420p'
  if (wrongVideoFormat) return false

  const fpsOutOfBounds = fps < VIDEO_TRANSCODING_FPS.MIN || fps > VIDEO_TRANSCODING_FPS.MAX
  if (fpsOutOfBounds) return false

  const maxVideoBitrate = getMaxBitrate(resolution.videoFileResolution, fps, VIDEO_TRANSCODING_FPS)
  if (bitRate > maxVideoBitrate) return false

  // check audio params (if audio stream exists)
  const audioStream = parsedAudio.audioStream
  if (!audioStream) return true

  if (audioStream[ 'codec_name' ] !== 'aac') return false

  const audioBitrate = audioStream[ 'bit_rate' ]
  const maxAudioBitrate = audio.bitrate[ 'aac' ](audioBitrate)

  // -1 means there is no ceiling to enforce
  if (maxAudioBitrate !== -1 && audioBitrate > maxAudioBitrate) return false

  return true
}
265
837666fe
RK
/**
 * Picks, among the standard framerates, the one leaving the smallest
 * remainder when dividing `fps` by it.
 *
 * @param fps framerate of the source
 * @param hd look in `VIDEO_TRANSCODING_FPS.HD_STANDARD` instead of `STANDARD`
 */
function getClosestFramerateStandard (fps: number, hd = false): number {
  const listName = hd ? 'HD_STANDARD' : 'STANDARD'

  // Sort a copy so the shared constant is left untouched
  const byRemainder = VIDEO_TRANSCODING_FPS[listName]
    .slice(0)
    .sort((a, b) => fps % a - fps % b)

  return byRemainder[0]
}
269
14d3270f
C
270// ---------------------------------------------------------------------------
271
272export {
52201311
C
273 getVideoStreamCodec,
274 getAudioStreamCodec,
275 getVideoStreamSize,
056aa7f2 276 getVideoFileResolution,
14d3270f
C
277 getDurationFromVideoFile,
278 generateImageFromVideoFile,
536598cf
C
279 TranscodeOptions,
280 TranscodeOptionsType,
73c69591 281 transcode,
7160878c 282 getVideoFileFPS,
06215f15 283 computeResolutionsToTranscode,
edb4ffc7 284 audio,
5ba49f26
FA
285 getVideoFileBitrate,
286 canDoQuickTranscode
73c69591
C
287}
288
289// ---------------------------------------------------------------------------
290
/**
 * Configures an x264 encoding: framerate, H264 preset and output size.
 *
 * @param command ffmpeg command to extend
 * @param options job description; `inputPath`, `resolution` and `isPortraitMode` are read
 * @returns the extended command
 */
async function buildx264Command (command: ffmpeg.FfmpegCommand, options: TranscodeOptions) {
  let fps = await getVideoFileFPS(options.inputPath)

  // On small/medium resolutions, limit FPS
  const tooFastForResolution = options.resolution !== undefined &&
    options.resolution < VIDEO_TRANSCODING_FPS.KEEP_ORIGIN_FPS_RESOLUTION_MIN &&
    fps > VIDEO_TRANSCODING_FPS.AVERAGE

  // The framerate is not a multiple of any HD standard framerate
  const notAnHdStandard = VIDEO_TRANSCODING_FPS.HD_STANDARD.every(value => fps % value !== 0)

  if (tooFastForResolution || notAnHdStandard) {
    // Get closest standard framerate by modulo: downsampling has to be done to a divisor of the nominal fps value
    fps = getClosestFramerateStandard(fps)
  }

  // The preset receives the framerate as it is BEFORE the hard limits below
  command = await presetH264(command, options.inputPath, options.resolution, fps)

  if (options.resolution !== undefined) {
    // '?x720' or '720x?' for example
    const size = options.isPortraitMode === true
      ? `${options.resolution}x?`
      : `?x${options.resolution}`

    command = command.size(size)
  }

  if (!fps) return command

  // Hard FPS limits
  if (fps > VIDEO_TRANSCODING_FPS.MAX) {
    fps = getClosestFramerateStandard(fps, true)
  } else if (fps < VIDEO_TRANSCODING_FPS.MIN) {
    fps = VIDEO_TRANSCODING_FPS.MIN
  }

  return command.withFPS(fps)
}
323
536598cf
C
/**
 * Configures the merge of the (looped) input with an audio file.
 *
 * @param command ffmpeg command to extend
 * @param options job description; `audioPath` and `resolution` are read
 * @returns the extended command
 */
async function buildAudioMergeCommand (command: ffmpeg.FfmpegCommand, options: MergeAudioTranscodeOptions) {
  const looped = command.loop(undefined)

  // The audio settings of the preset are derived from the audio file
  const encoded = await presetH264VeryFast(looped, options.audioPath, options.resolution)

  return encoded
    .input(options.audioPath)
    .videoFilter('scale=trunc(iw/2)*2:trunc(ih/2)*2') // Avoid "height not divisible by 2" error
    .outputOption('-tune stillimage')
    .outputOption('-shortest')
}
336
3a149e9f
C
/**
 * Configures an audio-only output by applying the `presetOnlyAudio` preset.
 *
 * @param command ffmpeg command to extend
 * @param options job description (not read here)
 * @returns the extended command
 */
async function buildOnlyAudioCommand (command: ffmpeg.FfmpegCommand, options: OnlyAudioTranscodeOptions) {
  const audioOnly = await presetOnlyAudio(command)

  return audioOnly
}
342
536598cf
C
/**
 * Configures a stream copy (no re-encoding) that drops the metadata and
 * sets the `faststart` mov flag.
 *
 * @param command ffmpeg command to extend
 * @returns the extended command
 */
async function buildQuickTranscodeCommand (command: ffmpeg.FfmpegCommand) {
  const copied = await presetCopy(command)

  const withoutMetadata = copied.outputOption('-map_metadata -1') // strip all metadata

  return withoutMetadata.outputOption('-movflags faststart')
}
351
/**
 * Configures an HLS output: codecs are copied or re-encoded with x264
 * depending on `options.copyCodecs`, then the HLS muxer options are added.
 *
 * @param command ffmpeg command to extend
 * @param options HLS job description
 * @returns the extended command
 */
async function buildHLSCommand (command: ffmpeg.FfmpegCommand, options: HLSTranscodeOptions) {
  const videoPath = getHLSVideoPath(options)

  let hlsCommand = options.copyCodecs
    ? await presetCopy(command)
    : await buildx264Command(command, options)

  // Added one by one, in this order
  const hlsOutputOptions = [
    '-hls_time 4',
    '-hls_list_size 0',
    '-hls_playlist_type vod',
    '-hls_segment_filename ' + videoPath,
    '-hls_segment_type fmp4',
    '-f hls',
    '-hls_flags single_file'
  ]

  for (const hlsOutputOption of hlsOutputOptions) {
    hlsCommand = hlsCommand.outputOption(hlsOutputOption)
  }

  return hlsCommand
}
368
/**
 * Path of the HLS video file: the file named `hlsPlaylist.videoFilename`,
 * in the directory of `outputPath`.
 */
function getHLSVideoPath (options: HLSTranscodeOptions) {
  const playlistDirectory = dirname(options.outputPath)
  const videoFilename = options.hlsPlaylist.videoFilename

  // Plain '/' concatenation: fixHLSPlaylistIfNeeded looks for this exact string in the playlist
  return `${playlistDirectory}/${videoFilename}`
}
372
536598cf
C
/**
 * For HLS jobs, rewrites the playlist at `outputPath` so that its
 * `#EXT-X-MAP:URI` entry holds the bare video file name instead of the
 * full video path. Does nothing for the other job types.
 *
 * @param options job description
 */
async function fixHLSPlaylistIfNeeded (options: TranscodeOptions) {
  if (options.type !== 'hls') return

  const playlist = (await readFile(options.outputPath)).toString()

  // Fix wrong mapping with some ffmpeg versions
  const wrongMapping = `#EXT-X-MAP:URI="${getHLSVideoPath(options)}",`
  const rightMapping = `#EXT-X-MAP:URI="${options.hlsPlaylist.videoFilename}",`

  await writeFile(options.outputPath, playlist.replace(wrongMapping, rightMapping))
}
387
/**
 * Probes a file and returns its first stream whose `codec_type` is `video`.
 *
 * @param path path of the media file to probe
 * @returns the stream description, or `null` when the file has no video
 *          stream; rejects with the ffprobe error on failure
 */
function getVideoStreamFromFile (path: string) {
  return new Promise<any>((resolve, reject) => {
    ffmpeg.ffprobe(path, (probeError, metadata) => {
      if (probeError) {
        reject(probeError)
        return
      }

      const firstVideoStream = metadata.streams.find(stream => stream.codec_type === 'video')

      resolve(firstVideoStream ? firstVideoStream : null)
    })
  })
}
4176e227
RK
398
/**
 * The H264 preset, with the x264 'veryfast' preset added on top.
 *
 * veryfast is a good trade-off between encoding speed and quality:
 * superfast and ultrafast encode faster, but with a noticeably
 * worse quality.
 *
 * MAIN reference: https://slhck.info/video/2017/03/01/rate-control.html
 * Our target situation is closer to a livestream than a stream, since we
 * want to reduce the encoding burden as much as possible, although not to
 * the point of a livestream, where there is a hard constraint on the
 * frames per second to be encoded.
 */
async function presetH264VeryFast (command: ffmpeg.FfmpegCommand, input: string, resolution: VideoResolution, fps?: number) {
  const h264Command = await presetH264(command, input, resolution, fps)

  return h264Command.outputOption('-preset:v veryfast')
}
421
4176e227
RK
/**
 * Audio helpers: probing of the audio stream and bitrate ceilings
 */
namespace audio {
  /**
   * Probes a file and resolves with the path reported by ffprobe and,
   * when there is one, the first stream whose `codec_type` is `audio`.
   * Rejects with the ffprobe error on failure.
   */
  export const get = (videoPath: string) => {
    // without position, ffprobe considers the last input only
    // we make it consider the first input only
    // if you pass a file path to pos, then ffprobe acts on that file directly
    return new Promise<{ absolutePath: string, audioStream?: any }>((resolve, reject) => {
      ffmpeg.ffprobe(videoPath, (err: any, data: ffmpeg.FfprobeData) => {
        if (err) return reject(err)

        const absolutePath = data.format.filename

        const audioStream = 'streams' in data
          ? data.streams.find(stream => stream[ 'codec_type' ] === 'audio')
          : undefined

        if (audioStream) return resolve({ absolutePath, audioStream })

        return resolve({ absolutePath })
      })
    })
  }

  /**
   * Bitrate ceilings, keyed by the codec name of the source stream.
   * Each function takes the source bitrate and returns the ceiling to apply.
   */
  export namespace bitrate {
    const baseKbitrate = 384

    // NOTE(review): multiplies by 8000, not 1000, despite the name - confirm the intended unit
    const toBits = (kbits: number) => kbits * 8000

    export const aac = (bitrate: number): number => {
      if (bitrate > toBits(baseKbitrate)) return baseKbitrate

      return -1 // we interpret it as a signal to copy the audio stream as is
    }

    export const mp3 = (bitrate: number): number => {
      /*
        a 192kbit/sec mp3 doesn't hold as much information as a 192kbit/sec aac.
        That's why, when using aac, we can go to lower kbit/sec. The equivalences
        made here are not made to be accurate, especially with good mp3 encoders.
      */
      if (bitrate <= toBits(192)) return 128
      if (bitrate <= toBits(384)) return 256

      return baseKbitrate
    }
  }
}
486
/**
 * Base H264/mp4 preset: libx264 video, faststart, metadata stripped, and
 * an audio configuration derived from the audio stream of `input`.
 *
 * As for the audio, quality '5' is the highest and ensures 96-112kbps/channel
 * See https://trac.ffmpeg.org/wiki/Encode/AAC#fdk_vbr
 *
 * @param command ffmpeg command to extend
 * @param input file whose audio stream drives the audio configuration
 * @param resolution target resolution, used to compute the target bitrate
 * @param fps target framerate; when falsy, no bitrate cap or keyframe interval is set
 * @returns the extended command
 */
async function presetH264 (command: ffmpeg.FfmpegCommand, input: string, resolution: VideoResolution, fps?: number) {
  let encoder = command
    .format('mp4')
    .videoCodec('libx264')
    .outputOption('-level 3.1') // 3.1 is the minimal resource allocation for our highest supported resolution
    .outputOption('-b_strategy 1') // NOTE: b-strategy 1 - heuristic algorithm, 16 is optimal B-frames for it
    .outputOption('-bf 16') // NOTE: Why 16: https://github.com/Chocobozzz/PeerTube/pull/774. b-strategy 2 -> B-frames<16
    .outputOption('-pix_fmt yuv420p') // allows import of source material with incompatible pixel formats (e.g. MJPEG video)
    .outputOption('-map_metadata -1') // strip all metadata
    .outputOption('-movflags faststart')

  const sourceAudio = (await audio.get(input)).audioStream

  if (!sourceAudio) {
    encoder = encoder.noAudio()
  } else {
    const availableEncoders = await checkFFmpegEncoders()

    if (availableEncoders.get('libfdk_aac')) {
      // we favor VBR, if a good AAC encoder is available
      encoder = encoder
        .audioCodec('libfdk_aac')
        .audioQuality(5)
    } else {
      // we try to reduce the ceiling bitrate by making rough matches of bitrates
      // of course this is far from perfect, but it might save some space in the end
      encoder = encoder.audioCodec('aac')

      const computeCeiling = audio.bitrate[ sourceAudio[ 'codec_name' ] ]

      if (computeCeiling) {
        const ceiling = computeCeiling(sourceAudio[ 'bit_rate' ])
        if (ceiling !== undefined && ceiling !== -1) encoder = encoder.audioBitrate(ceiling)
      }
    }
  }

  if (!fps) return encoder

  // Constrained Encoding (VBV)
  // https://slhck.info/video/2017/03/01/rate-control.html
  // https://trac.ffmpeg.org/wiki/Limiting%20the%20output%20bitrate
  const targetBitrate = getTargetBitrate(resolution, fps, VIDEO_TRANSCODING_FPS)
  encoder = encoder.outputOptions([ `-maxrate ${targetBitrate}`, `-bufsize ${targetBitrate * 2}` ])

  // Keyframe interval of 2 seconds for faster seeking and resolution switching.
  // https://streaminglearningcenter.com/blogs/whats-the-right-keyframe-interval.html
  // https://superuser.com/a/908325
  return encoder.outputOption(`-g ${fps * 2}`)
}
14aed608
C
540
/**
 * mp4 output where both the video and the audio streams are copied
 * instead of being re-encoded.
 */
async function presetCopy (command: ffmpeg.FfmpegCommand): Promise<ffmpeg.FfmpegCommand> {
  const mp4Command = command.format('mp4')

  return mp4Command
    .videoCodec('copy')
    .audioCodec('copy')
}
5c7d6508 547
/**
 * mp4 output without video, where the audio stream is copied instead of
 * being re-encoded.
 */
async function presetOnlyAudio (command: ffmpeg.FfmpegCommand): Promise<ffmpeg.FfmpegCommand> {
  const mp4Command = command.format('mp4')

  return mp4Command
    .audioCodec('copy')
    .noVideo()
}