2024-08-13 03:49:31 -05:00
|
|
|
import { randomInt } from '@peertube/peertube-core-utils'
|
|
|
|
import { VideoResolution, VideoResolutionType } from '@peertube/peertube-models'
|
|
|
|
import { CONFIG } from '@server/initializers/config.js'
|
2024-06-21 07:32:25 -05:00
|
|
|
import { execa, Options as ExecaNodeOptions } from 'execa'
|
2023-07-31 07:34:36 -05:00
|
|
|
import { ensureDir, pathExists } from 'fs-extra/esm'
|
2024-08-13 07:16:00 -05:00
|
|
|
import { chmod, writeFile } from 'fs/promises'
|
2023-07-31 07:34:36 -05:00
|
|
|
import { OptionsOfBufferResponseBody } from 'got'
|
2022-03-21 02:33:27 -05:00
|
|
|
import { dirname, join } from 'path'
|
2023-07-31 07:34:36 -05:00
|
|
|
import { logger, loggerTagsFactory } from '../logger.js'
|
|
|
|
import { getProxy, isProxyEnabled } from '../proxy.js'
|
2024-08-14 08:32:25 -05:00
|
|
|
import { isBinaryResponse, unsafeSSRFGot } from '../requests.js'
|
2021-10-21 09:28:39 -05:00
|
|
|
|
2024-06-21 07:32:25 -05:00
|
|
|
// Subset of execa options (`cwd`, `maxBuffer`) that callers provide for the spawned youtube-dl process
type ProcessOptions = Pick<ExecaNodeOptions, 'cwd' | 'maxBuffer'>
|
|
|
|
|
2021-10-21 09:28:39 -05:00
|
|
|
// Logger tags helper for this module: its result is passed to (or spread into the metadata of) every logger call below
const lTags = loggerTagsFactory('youtube-dl')
|
|
|
|
|
|
|
|
// Location of the youtube-dl release file: the configured bin directory joined with the configured release name
const youtubeDLBinaryPath = join(CONFIG.STORAGE.BIN_DIR, CONFIG.IMPORT.VIDEOS.HTTP.YOUTUBE_DL_RELEASE.NAME)
|
|
|
|
|
|
|
|
/**
 * Thin wrapper around the youtube-dl (or compatible) command line binary stored at `youtubeDLBinaryPath`.
 *
 * Instances are obtained through `YoutubeDLCLI.safeGet()`, which downloads the binary first when it is missing.
 */
export class YoutubeDLCLI {

  /**
   * Return a CLI wrapper, trying to download the binary beforehand if it does not exist on disk.
   *
   * Download failures are logged by `updateYoutubeDLBinary()` and not rethrown,
   * so an instance is returned even if the binary could not be fetched.
   */
  static async safeGet () {
    if (!await pathExists(youtubeDLBinaryPath)) {
      await ensureDir(dirname(youtubeDLBinaryPath))

      await this.updateYoutubeDLBinary()
    }

    return new YoutubeDLCLI()
  }

  /**
   * Download the release configured in `CONFIG.IMPORT.VIDEOS.HTTP.YOUTUBE_DL_RELEASE` and write it to `youtubeDLBinaryPath`.
   *
   * The configured URL may directly serve the binary, or serve a JSON array of releases:
   * in that case the first non-prerelease entry is used and the asset named after the configured release name is downloaded.
   *
   * Errors are logged and swallowed on purpose: this method never rejects.
   */
  static async updateYoutubeDLBinary () {
    const url = CONFIG.IMPORT.VIDEOS.HTTP.YOUTUBE_DL_RELEASE.URL

    logger.info('Updating youtubeDL binary from %s.', url, lTags())

    const gotOptions: OptionsOfBufferResponseBody = {
      context: { bodyKBLimit: 100_000 },
      responseType: 'buffer'
    }

    // Optional bearer token sent with the download requests
    if (process.env.YOUTUBE_DL_DOWNLOAD_BEARER_TOKEN) {
      gotOptions.headers = {
        authorization: 'Bearer ' + process.env.YOUTUBE_DL_DOWNLOAD_BEARER_TOKEN
      }
    }

    try {
      let gotResult = await unsafeSSRFGot(url, gotOptions)

      // Not the binary itself: interpret the body as a list of releases and look for the asset to download
      if (!isBinaryResponse(gotResult)) {
        const json = JSON.parse(gotResult.body.toString())
        if (!Array.isArray(json)) throw new Error('Release list is not an array')

        const latest = json.find(release => release.prerelease === false)
        if (!latest) throw new Error('Cannot find latest release')

        const releaseName = CONFIG.IMPORT.VIDEOS.HTTP.YOUTUBE_DL_RELEASE.NAME
        const releaseAsset = latest.assets.find(a => a.name === releaseName)
        if (!releaseAsset) throw new Error(`Cannot find appropriate release with name ${releaseName} in release assets`)

        gotResult = await unsafeSSRFGot(releaseAsset.browser_download_url, gotOptions)
      }

      if (!isBinaryResponse(gotResult)) {
        throw new Error('Not a binary response')
      }

      await writeFile(youtubeDLBinaryPath, gotResult.body)

      // When a python path is configured the file is passed as an argument to that interpreter (see run()),
      // so it is only made executable when it is spawned directly
      if (!CONFIG.IMPORT.VIDEOS.HTTP.YOUTUBE_DL_RELEASE.PYTHON_PATH) {
        await chmod(youtubeDLBinaryPath, '744')
      }

      logger.info('youtube-dl updated %s.', youtubeDLBinaryPath, lTags())
    } catch (err) {
      logger.error('Cannot update youtube-dl from %s.', url, { err, ...lTags() })
    }
  }

  /**
   * Build the `-f` format selector string: selectors are joined with `/`, from most to least preferred.
   *
   * @param enabledResolutions resolutions to consider: the highest one is targeted (720p if the list is empty)
   * @param useBestFormat if true, skip the resolution-specific selectors and only keep the generic fallbacks
   */
  static getYoutubeDLVideoFormat (enabledResolutions: VideoResolutionType[], useBestFormat: boolean): string {
    /**
     * list of format selectors in order of preference
     * see https://github.com/ytdl-org/youtube-dl#format-selection
     *
     * case #1 asks for a mp4 using h264 (avc1) and the exact resolution in the hope
     * of being able to do a "quick-transcode"
     * case #2 is the first fallback. No "quick-transcode" means we can get anything else (like vp9)
     * case #3 is the resolution-degraded equivalent of #1, and already a pretty safe fallback
     *
     * in any case we avoid AV1, see https://github.com/Chocobozzz/PeerTube/issues/3499
     **/

    let result: string[] = []

    if (!useBestFormat) {
      const resolution = enabledResolutions.length === 0
        ? VideoResolution.H_720P
        : Math.max(...enabledResolutions)

      result = [
        `bestvideo[vcodec^=avc1][height=${resolution}]+bestaudio[ext=m4a]`, // case #1
        `bestvideo[vcodec!*=av01][vcodec!*=vp9.2][height=${resolution}]+bestaudio`, // case #2
        `bestvideo[vcodec^=avc1][height<=${resolution}]+bestaudio[ext=m4a]` // case #3
      ]
    }

    return result.concat([
      'bestvideo[vcodec!*=av01][vcodec!*=vp9.2]+bestaudio',
      'best[vcodec!*=av01][vcodec!*=vp9.2]', // case fallback for known formats
      'bestvideo[ext=mp4]+bestaudio[ext=m4a]',
      'best' // Ultimate fallback
    ]).join('/')
  }

  private constructor () {
    // Instances are created through safeGet()
  }

  /**
   * Download `options.url` into `options.output` using the given format selector, merging the output as mp4.
   *
   * @returns the stdout lines of the process, or undefined if it printed nothing
   */
  download (options: {
    url: string
    format: string
    output: string
    processOptions: ProcessOptions
    timeout?: number
    additionalYoutubeDLArgs?: string[]
  }) {
    const args = (options.additionalYoutubeDLArgs ?? []).concat([
      '--merge-output-format',
      'mp4',
      '-f',
      options.format,
      '-o',
      options.output
    ])

    return this.run({
      url: options.url,
      processOptions: options.processOptions,
      timeout: options.timeout,
      args
    })
  }

  /**
   * Run the binary with `--dump-json` and parse every stdout line as JSON.
   *
   * @returns undefined if the process printed nothing, the parsed object if there is a single line,
   * or an array of parsed objects otherwise
   */
  async getInfo (options: {
    url: string
    format: string
    processOptions: ProcessOptions
    additionalYoutubeDLArgs?: string[]
  }) {
    const { url, format, additionalYoutubeDLArgs = [], processOptions } = options

    const completeArgs = additionalYoutubeDLArgs.concat([ '--dump-json', '-f', format ])

    const data = await this.run({ url, args: completeArgs, processOptions })
    if (!data) return undefined

    const info = data.map(d => JSON.parse(d))

    return info.length === 1
      ? info[0]
      : info
  }

  /**
   * List the entries of a playlist/channel URL without downloading them.
   *
   * @returns the `getInfo()` result, always wrapped in an array when it is defined
   */
  async getListInfo (options: {
    url: string
    latestVideosCount?: number
    processOptions: ProcessOptions
  }): Promise<{ upload_date: string, webpage_url: string }[]> {
    const additionalYoutubeDLArgs = [ '--skip-download', '--playlist-reverse' ]

    if (CONFIG.IMPORT.VIDEOS.HTTP.YOUTUBE_DL_RELEASE.NAME === 'yt-dlp') {
      // Optimize listing videos only when using yt-dlp because it is bugged with youtube-dl when fetching a channel
      additionalYoutubeDLArgs.push('--flat-playlist')
    }

    if (options.latestVideosCount !== undefined) {
      additionalYoutubeDLArgs.push('--playlist-end', options.latestVideosCount.toString())
    }

    const result = await this.getInfo({
      url: options.url,
      format: YoutubeDLCLI.getYoutubeDLVideoFormat([], false),
      processOptions: options.processOptions,
      additionalYoutubeDLArgs
    })

    if (!result) return result
    if (!Array.isArray(result)) return [ result ]

    return result
  }

  /**
   * Ask the binary to write all available subtitles for `options.url`.
   *
   * @returns the subtitle file paths extracted from the "[info] Writing video subtitles to: " output lines,
   * or an empty array if the process printed nothing
   */
  async getSubs (options: {
    url: string
    format: 'vtt'
    processOptions: ProcessOptions
  }) {
    const { url, format, processOptions } = options

    const args = [ '--skip-download', '--all-subs', `--sub-format=${format}` ]

    const data = await this.run({ url, args, processOptions })
    // run() returns undefined when the process printed nothing: there are no subtitle files to report
    if (!data) return []

    const skipString = '[info] Writing video subtitles to: '

    return data
      .filter(line => line.startsWith(skipString))
      .map(line => line.slice(skipString.length))
  }

  /**
   * Spawn the youtube-dl process with the proxy/IP/ffmpeg options prepended to `options.args` and the URL as last argument.
   *
   * If `options.timeout` (milliseconds, as given to setTimeout) is set, the process is killed once it elapses.
   *
   * @returns stdout split by line, or undefined if stdout is empty
   */
  private async run (options: {
    url: string
    args: string[]
    timeout?: number
    processOptions: ProcessOptions
  }) {
    const { url, args, timeout, processOptions } = options

    let completeArgs = this.wrapWithProxyOptions(args)
    completeArgs = this.wrapWithIPOptions(completeArgs)
    completeArgs = this.wrapWithFFmpegOptions(completeArgs)

    // With a configured python path, spawn the interpreter and give it the downloaded file as first argument
    const subProcessBinary = CONFIG.IMPORT.VIDEOS.HTTP.YOUTUBE_DL_RELEASE.PYTHON_PATH || youtubeDLBinaryPath
    const subProcessArgs = [ ...completeArgs, url ]
    if (subProcessBinary !== youtubeDLBinaryPath) subProcessArgs.unshift(youtubeDLBinaryPath)

    const subProcess = execa(subProcessBinary, subProcessArgs, processOptions)

    const killTimer = timeout
      ? setTimeout(() => subProcess.kill(), timeout)
      : undefined

    try {
      const output = await subProcess

      logger.debug('Run youtube-dl command.', { command: output.command, ...lTags() })

      return output.stdout
        ? output.stdout.trim().split(/\r?\n/)
        : undefined
    } finally {
      // Do not leave a pending timer behind once the process has settled
      if (killTimer !== undefined) clearTimeout(killTimer)
    }
  }

  /**
   * Prepend `--proxy <proxy>` to the arguments if a proxy is available.
   *
   * Proxies from `CONFIG.IMPORT.VIDEOS.HTTP.PROXIES` take precedence (one is picked at random),
   * otherwise the result of `getProxy()` is used when `isProxyEnabled()` is true.
   */
  private wrapWithProxyOptions (args: string[]) {
    const config = CONFIG.IMPORT.VIDEOS.HTTP.PROXIES
    const configProxyEnabled = Array.isArray(config) && config.length !== 0

    if (configProxyEnabled || isProxyEnabled()) {
      // NOTE(review): assumes the upper bound of randomInt() is exclusive - confirm
      const proxy = configProxyEnabled
        ? config[randomInt(0, config.length)]
        : getProxy()

      logger.debug('Using proxy %s for YoutubeDL', proxy, lTags())

      return [ '--proxy', proxy ].concat(args)
    }

    return args
  }

  /**
   * Prepend `--force-ipv4` to the arguments if `CONFIG.IMPORT.VIDEOS.HTTP.FORCE_IPV4` is enabled.
   */
  private wrapWithIPOptions (args: string[]) {
    if (CONFIG.IMPORT.VIDEOS.HTTP.FORCE_IPV4) {
      logger.debug('Force ipv4 for YoutubeDL', lTags())

      return [ '--force-ipv4' ].concat(args)
    }

    return args
  }

  /**
   * Prepend `--ffmpeg-location <path>` to the arguments if the FFMPEG_PATH environment variable is set.
   */
  private wrapWithFFmpegOptions (args: string[]) {
    if (process.env.FFMPEG_PATH) {
      logger.debug('Using ffmpeg location %s for YoutubeDL', process.env.FFMPEG_PATH, lTags())

      return [ '--ffmpeg-location', process.env.FFMPEG_PATH ].concat(args)
    }

    return args
  }
}
|