2021-08-27 07:32:44 -05:00
|
|
|
import express from 'express'
|
2023-07-31 07:34:36 -05:00
|
|
|
import truncate from 'lodash-es/truncate.js'
|
2023-04-21 07:55:10 -05:00
|
|
|
import { ErrorLevel, SitemapStream, streamToPromise } from 'sitemap'
|
2023-07-31 07:34:36 -05:00
|
|
|
import { logger } from '@server/helpers/logger.js'
|
|
|
|
import { getServerActor } from '@server/models/application/application.js'
|
|
|
|
import { buildNSFWFilter } from '../helpers/express-utils.js'
|
|
|
|
import { ROUTE_CACHE_LIFETIME, WEBSERVER } from '../initializers/constants.js'
|
2024-10-23 00:17:02 -05:00
|
|
|
import { apiRateLimiter, asyncMiddleware, cacheRoute } from '../middlewares/index.js'
|
2023-07-31 07:34:36 -05:00
|
|
|
import { AccountModel } from '../models/account/account.js'
|
|
|
|
import { VideoModel } from '../models/video/video.js'
|
|
|
|
import { VideoChannelModel } from '../models/video/video-channel.js'
|
2024-10-23 00:17:02 -05:00
|
|
|
import { VideoFileStream, VideoInclude } from '@peertube/peertube-models'
|
2018-12-05 10:27:24 -06:00
|
|
|
|
2023-07-25 08:18:10 -05:00
|
|
|
// Router dedicated to the sitemap endpoint
const sitemapRouter = express.Router()

// Handlers are registered in this order: rate limiter, route cache, sitemap generation
sitemapRouter.use(
  '/sitemap.xml',
  apiRateLimiter,
  cacheRoute(ROUTE_CACHE_LIFETIME.SITEMAP),
  asyncMiddleware(getSitemap)
)
|
|
|
|
|
|
|
|
// ---------------------------------------------------------------------------
|
|
|
|
|
|
|
|
// Only the router is exposed; the sitemap builders below stay module-private
export { sitemapRouter }
|
|
|
|
|
|
|
|
// ---------------------------------------------------------------------------
|
|
|
|
|
|
|
|
/**
 * Express handler that builds the sitemap and sends it as XML.
 *
 * Entries are emitted in this order: basic pages, local videos, video channels, accounts.
 */
async function getSitemap (req: express.Request, res: express.Response) {
  const basicUrls = getSitemapBasicUrls()

  // Fetched one after the other, in the same order as they appear in the sitemap
  const videoUrls = await getSitemapLocalVideoUrls()
  const channelUrls = await getSitemapVideoChannelUrls()
  const accountUrls = await getSitemapAccountUrls()

  const urls = [ ...basicUrls, ...videoUrls, ...channelUrls, ...accountUrls ]

  const sitemapStream = new SitemapStream({
    hostname: WEBSERVER.URL,

    errorHandler: (err: Error, level: ErrorLevel) => {
      if (level === 'warn') {
        logger.warn('Warning in sitemap generation.', { err })
        return
      }

      // Any level other than 'warn' and 'throw' is ignored
      if (level !== 'throw') return

      logger.error('Error in sitemap generation.', { err })

      throw err
    }
  })

  urls.forEach(urlObj => {
    sitemapStream.write(urlObj)
  })
  sitemapStream.end()

  const xml = await streamToPromise(sitemapStream)

  res.header('Content-Type', 'application/xml')
    .send(xml)
}
|
|
|
|
|
|
|
|
/**
 * Build one sitemap entry per channel returned by `VideoChannelModel.listLocalsForSitemap('createdAt')`.
 *
 * @returns objects holding the client URL of each channel
 */
async function getSitemapVideoChannelUrls () {
  const channels = await VideoChannelModel.listLocalsForSitemap('createdAt')

  const entries: { url: string }[] = []

  for (const channel of channels) {
    entries.push({ url: channel.getClientUrl() })
  }

  return entries
}
|
|
|
|
|
|
|
|
/**
 * Build one sitemap entry per account returned by `AccountModel.listLocalsForSitemap('createdAt')`.
 *
 * @returns objects holding the client URL of each account
 */
async function getSitemapAccountUrls () {
  const accounts = await AccountModel.listLocalsForSitemap('createdAt')

  const entries: { url: string }[] = []

  for (const account of accounts) {
    entries.push({ url: account.getClientUrl() })
  }

  return entries
}
|
|
|
|
|
|
|
|
/**
 * Build the sitemap entries (watch page URL + video metadata) for the videos
 * returned by `VideoModel.listForApi()` with `isLocal: true`.
 *
 * Videos are read page by page (200 per page, sorted by `createdAt`) until an
 * empty page is returned or 1000 pages have been read.
 *
 * @returns one object per video, with the watch URL and a single-element `video` array
 */
async function getSitemapLocalVideoUrls () {
  const serverActor = await getServerActor()

  const acc: { url: string, video: any[] }[] = []

  const chunkSize = 200
  // Hard limit on the number of pages, so the loop always terminates
  const maxChunks = 1000

  for (let i = 0; i < maxChunks; i++) {
    const { data } = await VideoModel.listForApi({
      start: chunkSize * i,
      count: chunkSize,
      sort: 'createdAt',
      displayOnlyForFollower: {
        actorId: serverActor.id,
        orLocalVideos: true
      },
      isLocal: true,
      nsfw: buildNSFWFilter(),
      countVideos: false,
      include: VideoInclude.FILES | VideoInclude.TAGS
    })

    // An empty page means there is nothing left to list
    if (data.length === 0) break

    // Append in place: re-creating the accumulator with concat() on every page
    // copies all previously collected entries again and again
    for (const v of data) {
      // Prefer the HLS master playlist, then the best video file, then the best audio file
      const contentLoc = v.getHLSPlaylist()?.getMasterPlaylistUrl(v) ||
        v.getMaxQualityFile(VideoFileStream.VIDEO)?.getFileUrl(v) ||
        v.getMaxQualityFile(VideoFileStream.AUDIO)?.getFileUrl(v)

      acc.push({
        url: WEBSERVER.URL + v.getWatchStaticPath(),
        video: [
          {
            // Sitemap title should be < 100 characters
            'title': truncate(v.name, { length: 100, omission: '...' }),
            // Sitemap description should be < 2000 characters
            'description': truncate(v.description || v.name, { length: 2000, omission: '...' }),
            'player_loc': WEBSERVER.URL + v.getEmbedStaticPath(),
            'thumbnail_loc': WEBSERVER.URL + v.getMiniatureStaticPath(),
            'content_loc': contentLoc,
            'duration': v.duration,
            'view_count': v.views,
            'publication_date': v.publishedAt.toISOString(),
            'uploader': v.VideoChannel.getDisplayName(),
            'uploader:info': v.VideoChannel.getClientUrl(),
            'live': v.isLive ? 'YES' : 'NO',
            'family_friendly': v.nsfw ? 'NO' : 'YES',
            // Rating is between 0.0 and 5.0; "|| 0" covers the NaN produced when there are no likes and no dislikes
            'rating': (v.likes * 5) / (v.likes + v.dislikes) || 0,
            'tag': v.Tags.map(t => t.name)
          }
        ]
      })
    }
  }

  return acc
}
|
|
|
|
|
|
|
|
/**
 * Build the sitemap entries of the fixed instance pages.
 *
 * @returns one object per page, whose `url` is `WEBSERVER.URL` followed by the page path
 */
function getSitemapBasicUrls () {
  const basicUrls: { url: string }[] = []

  for (const path of [ '/about/instance', '/videos/local' ]) {
    basicUrls.push({ url: WEBSERVER.URL + path })
  }

  return basicUrls
}
|