Skip to content

Commit

Permalink
Metadata to know if the caption is auto generated
Browse files Browse the repository at this point in the history
  • Loading branch information
Chocobozzz committed Jun 27, 2024
1 parent a252262 commit 29ccc0c
Show file tree
Hide file tree
Showing 22 changed files with 101 additions and 29 deletions.
1 change: 1 addition & 0 deletions packages/models/src/activitypub/objects/index.ts
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@ export * from './cache-file-object.js'
export * from './common-objects.js'
export * from './playlist-element-object.js'
export * from './playlist-object.js'
export * from './video-caption-object.js'
export * from './video-chapters-object.js'
export * from './video-comment-object.js'
export * from './video-object.js'
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
import { ActivityIdentifierObject } from './common-objects.js'

/**
 * ActivityPub representation of a video caption: the fields of
 * `ActivityIdentifierObject` plus a flag telling whether the caption was
 * automatically generated.
 */
export interface VideoCaptionObject extends ActivityIdentifierObject {
// `true` when the caption was automatically generated rather than provided by a user.
// NOTE(review): objects received from remote instances may omit this field; consumers should not assume it is always present.
automaticallyGenerated: boolean
}
3 changes: 2 additions & 1 deletion packages/models/src/activitypub/objects/video-object.ts
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@ import {
ActivityTagObject,
ActivityUrlObject
} from './common-objects.js'
import { VideoCaptionObject } from './video-caption-object.js'
import { VideoChapterObject } from './video-chapters-object.js'

export interface VideoObject {
Expand All @@ -18,7 +19,7 @@ export interface VideoObject {
category: ActivityIdentifierObject
licence: ActivityIdentifierObject
language: ActivityIdentifierObject
subtitleLanguage: ActivityIdentifierObject[]
subtitleLanguage: VideoCaptionObject[]

views: number

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -73,6 +73,7 @@ export interface VideoExportJSON {
language: string
filename: string
fileUrl: string
automaticallyGenerated: boolean
}[]

chapters: {
Expand Down
1 change: 1 addition & 0 deletions packages/models/src/videos/caption/video-caption.model.ts
Original file line number Diff line number Diff line change
Expand Up @@ -3,5 +3,6 @@ import { VideoConstant } from '../video-constant.model.js'
/**
 * Caption of a video as exposed by the REST API.
 */
export interface VideoCaption {
// Caption language as an id/label pair (e.g. id 'ar', label 'Arabic')
language: VideoConstant<string>
// Path of the caption file (e.g. '/lazy-static/video-captions/<uuid>-ar.vtt')
captionPath: string
// Whether the caption was automatically generated (e.g. by a transcription job) instead of being uploaded
automaticallyGenerated: boolean
// Last update date, serialized as an ISO 8601 string
updatedAt: string
}
2 changes: 1 addition & 1 deletion packages/tests/package.json
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@
"scripts": {
"build": "tsc",
"watch": "tsc -w",
"install-dependencies:transcription": "pip install -r ./requirements.txt ../transcription-devtools/requirements.txt"
"install-dependencies:transcription": "pip install -r ./requirements.txt -r ../transcription-devtools/requirements.txt"
},
"dependencies": {}
}
2 changes: 2 additions & 0 deletions packages/tests/src/api/videos/video-captions.ts
Original file line number Diff line number Diff line change
Expand Up @@ -72,12 +72,14 @@ describe('Test video captions', function () {
expect(caption1.language.id).to.equal('ar')
expect(caption1.language.label).to.equal('Arabic')
expect(caption1.captionPath).to.match(new RegExp('^/lazy-static/video-captions/' + uuidRegex + '-ar.vtt$'))
expect(caption1.automaticallyGenerated).to.be.false
await testCaptionFile(server.url, caption1.captionPath, 'Subtitle good 1.')

// Second caption: every assertion below must target caption2, including the
// automaticallyGenerated flag (uploaded captions are not auto-generated)
const caption2 = body.data[1]
expect(caption2.language.id).to.equal('zh')
expect(caption2.language.label).to.equal('Chinese')
expect(caption2.captionPath).to.match(new RegExp('^/lazy-static/video-captions/' + uuidRegex + '-zh.vtt$'))
expect(caption2.automaticallyGenerated).to.be.false
await testCaptionFile(server.url, caption2.captionPath, 'Subtitle good 2.')
}
})
Expand Down
10 changes: 5 additions & 5 deletions packages/tests/src/api/videos/video-transcription.ts
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,7 @@ import {
waitJobs
} from '@peertube/peertube-server-commands'
import { FIXTURE_URLS } from '@tests/shared/fixture-urls.js'
import { checkCaption, checkLanguage, checkNoCaption, uploadForTranscription } from '@tests/shared/transcription.js'
import { checkAutoCaption, checkLanguage, checkNoCaption, uploadForTranscription } from '@tests/shared/transcription.js'

describe('Test video transcription', function () {
let servers: PeerTubeServer[]
Expand Down Expand Up @@ -48,7 +48,7 @@ describe('Test video transcription', function () {
await waitJobs(servers)
await checkLanguage(servers, uuid, 'en')

await checkCaption(servers, uuid)
await checkAutoCaption(servers, uuid)
})

it('Should run transcription on upload by default', async function () {
Expand All @@ -57,7 +57,7 @@ describe('Test video transcription', function () {
const uuid = await uploadForTranscription(servers[0])

await waitJobs(servers)
await checkCaption(servers, uuid)
await checkAutoCaption(servers, uuid)
await checkLanguage(servers, uuid, 'en')
})

Expand All @@ -73,7 +73,7 @@ describe('Test video transcription', function () {
})

await waitJobs(servers)
await checkCaption(servers, video.uuid)
await checkAutoCaption(servers, video.uuid)
await checkLanguage(servers, video.uuid, 'en')
})

Expand All @@ -96,7 +96,7 @@ describe('Test video transcription', function () {

await servers[0].live.waitUntilReplacedByReplay({ videoId: video.id })
await waitJobs(servers)
await checkCaption(servers, video.uuid, 'WEBVTT\n\n00:')
await checkAutoCaption(servers, video.uuid, 'WEBVTT\n\n00:')
await checkLanguage(servers, video.uuid, 'en')

await servers[0].config.enableLive({ allowReplay: false })
Expand Down
4 changes: 2 additions & 2 deletions packages/tests/src/peertube-runner/video-transcription.ts
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,7 @@ import {
} from '@peertube/peertube-server-commands'
import { checkPeerTubeRunnerCacheIsEmpty } from '@tests/shared/directories.js'
import { PeerTubeRunnerProcess } from '@tests/shared/peertube-runner-process.js'
import { checkCaption, checkLanguage, checkNoCaption, uploadForTranscription } from '@tests/shared/transcription.js'
import { checkAutoCaption, checkLanguage, checkNoCaption, uploadForTranscription } from '@tests/shared/transcription.js'

describe('Test transcription in peertube-runner program', function () {
let servers: PeerTubeServer[] = []
Expand Down Expand Up @@ -46,7 +46,7 @@ describe('Test transcription in peertube-runner program', function () {
const uuid = await uploadForTranscription(servers[0])
await waitJobs(servers, { runnerJobs: true })

await checkCaption(servers, uuid)
await checkAutoCaption(servers, uuid)
await checkLanguage(servers, uuid, 'en')
})

Expand Down
3 changes: 2 additions & 1 deletion packages/tests/src/shared/transcription.ts
Original file line number Diff line number Diff line change
Expand Up @@ -28,7 +28,7 @@ export function getCustomModelPath (modelName: CustomModelName) {

// ---------------------------------------------------------------------------

export async function checkCaption (servers: PeerTubeServer[], uuid: string, captionContains = 'WEBVTT\n\n00:00.000 --> 00:') {
export async function checkAutoCaption (servers: PeerTubeServer[], uuid: string, captionContains = 'WEBVTT\n\n00:00.000 --> 00:') {
for (const server of servers) {
const body = await server.captions.list({ videoId: uuid })
expect(body.total).to.equal(1)
Expand All @@ -37,6 +37,7 @@ export async function checkCaption (servers: PeerTubeServer[], uuid: string, cap
const caption = body.data[0]
expect(caption.language.id).to.equal('en')
expect(caption.language.label).to.equal('English')
expect(caption.automaticallyGenerated).to.be.true

{
await testCaptionFile(server.url, caption.captionPath, captionContains)
Expand Down
7 changes: 6 additions & 1 deletion server/core/controllers/api/videos/captions.ts
Original file line number Diff line number Diff line change
Expand Up @@ -81,7 +81,12 @@ async function createVideoCaption (req: express.Request, res: express.Response)

const captionLanguage = req.params.captionLanguage

const videoCaption = await createLocalCaption({ video, language: captionLanguage, path: videoCaptionPhysicalFile.path })
const videoCaption = await createLocalCaption({
video,
language: captionLanguage,
path: videoCaptionPhysicalFile.path,
automaticallyGenerated: false
})

await sequelizeTypescript.transaction(async t => {
await federateVideoIfNeeded(video, false, t)
Expand Down
1 change: 1 addition & 0 deletions server/core/helpers/activity-pub-utils.ts
Original file line number Diff line number Diff line change
Expand Up @@ -73,6 +73,7 @@ const contextStore: { [ id in ContextType ]: (string | { [ id: string ]: string
category: 'sc:category',
licence: 'sc:license',
subtitleLanguage: 'sc:subtitleLanguage',
automaticallyGenerated: 'pt:automaticallyGenerated',
sensitive: 'as:sensitive',
language: 'sc:inLanguage',
identifier: 'sc:identifier',
Expand Down
2 changes: 1 addition & 1 deletion server/core/initializers/constants.ts
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,7 @@ import { cpus } from 'os'

// ---------------------------------------------------------------------------

const LAST_MIGRATION_VERSION = 855
const LAST_MIGRATION_VERSION = 860

// ---------------------------------------------------------------------------

Expand Down
31 changes: 31 additions & 0 deletions server/core/initializers/migrations/0860-caption-generated.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,31 @@
import * as Sequelize from 'sequelize'

/**
 * Adds the non-nullable boolean `automaticallyGenerated` column to the
 * `videoCaption` table.
 *
 * The column is first created with a `false` default (presumably so rows that
 * already exist receive a value), then altered so the default is reset to
 * `null` while the column stays non-nullable.
 *
 * @param utils - migration helpers; both statements run inside `utils.transaction`
 */
async function up (utils: {
  transaction: Sequelize.Transaction
  queryInterface: Sequelize.QueryInterface
  sequelize: Sequelize.Sequelize
}): Promise<void> {
  const { queryInterface, transaction } = utils

  const tableName = 'videoCaption'
  const columnName = 'automaticallyGenerated'

  // Step 1: create the column with a default value
  const creationAttributes = {
    type: Sequelize.BOOLEAN,
    defaultValue: false,
    allowNull: false
  }
  await queryInterface.addColumn(tableName, columnName, creationAttributes, { transaction })

  // Step 2: same definition, but with the default reset to null
  const finalAttributes = {
    type: Sequelize.BOOLEAN,
    defaultValue: null,
    allowNull: false
  }
  await queryInterface.changeColumn(tableName, columnName, finalAttributes, { transaction })
}

/**
 * Rollback is not supported for this migration.
 *
 * @throws Error always, with the message 'Not implemented.'
 */
function down (options) {
  const reason = 'Not implemented.'

  throw new Error(reason)
}

export {
down, up
}
Original file line number Diff line number Diff line change
Expand Up @@ -155,6 +155,7 @@ export function getCaptionAttributesFromObject (video: MVideoId, videoObject: Vi
videoId: video.id,
filename: VideoCaptionModel.generateCaptionName(c.identifier),
language: c.identifier,
automaticallyGenerated: c.automaticallyGenerated === true,
fileUrl: c.url
}))
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -198,6 +198,7 @@ export class VideosExporter extends AbstractUserExporter <VideoExportJSON> {
updatedAt: c.updatedAt.toISOString(),
language: c.language,
filename: c.filename,
automaticallyGenerated: c.automaticallyGenerated,
fileUrl: c.getFileUrl(video)
}))
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -97,6 +97,7 @@ export class VideosImporter extends AbstractUserImporter <VideoExportJSON, Impor
if (!isArray(o.chapters)) o.chapters = []

o.tags = o.tags.filter(t => isVideoTagValid(t))

o.captions = o.captions.filter(c => isVideoCaptionLanguageValid(c.language))
o.chapters = o.chapters.filter(c => isVideoChapterTimecodeValid(c.timecode) && isVideoChapterTitleValid(c.title))

Expand Down Expand Up @@ -269,7 +270,12 @@ export class VideosImporter extends AbstractUserImporter <VideoExportJSON, Impor

if (!await this.isFileValidOrLog(absoluteFilePath, CONSTRAINTS_FIELDS.VIDEO_CAPTIONS.CAPTION_FILE.FILE_SIZE.max)) continue

await createLocalCaption({ video, language: captionImport.language, path: absoluteFilePath })
await createLocalCaption({
video,
language: captionImport.language,
path: absoluteFilePath,
automaticallyGenerated: captionImport.automaticallyGenerated === true
})

captionPaths.push(absoluteFilePath)
}
Expand Down
9 changes: 6 additions & 3 deletions server/core/lib/video-captions.ts
Original file line number Diff line number Diff line change
Expand Up @@ -25,13 +25,15 @@ export async function createLocalCaption (options: {
video: MVideo
path: string
language: string
automaticallyGenerated: boolean
}) {
const { language, path, video } = options
const { language, path, video, automaticallyGenerated } = options

const videoCaption = new VideoCaptionModel({
videoId: video.id,
filename: VideoCaptionModel.generateCaptionName(language),
language
language,
automaticallyGenerated
}) as MVideoCaption

await moveAndProcessCaptionFile({ path }, videoCaption)
Expand Down Expand Up @@ -148,7 +150,8 @@ export async function onTranscriptionEnded (options: {
const caption = await createLocalCaption({
video,
language,
path: vttPath
path: vttPath,
automaticallyGenerated: true
})

await sequelizeTypescript.transaction(async t => {
Expand Down
7 changes: 6 additions & 1 deletion server/core/lib/video-pre-import.ts
Original file line number Diff line number Diff line change
Expand Up @@ -317,7 +317,12 @@ async function processYoutubeSubtitles (youtubeDL: YoutubeDLWrapper, targetUrl:
continue
}

await createLocalCaption({ language: subtitle.language, path: subtitle.path, video })
await createLocalCaption({
language: subtitle.language,
path: subtitle.path,
video,
automaticallyGenerated: false
})

logger.info('Added %s youtube-dl subtitle', subtitle.path)
}
Expand Down
26 changes: 16 additions & 10 deletions server/core/models/video/video-caption.ts
Original file line number Diff line number Diff line change
@@ -1,3 +1,12 @@
import { VideoCaption, VideoCaptionObject } from '@peertube/peertube-models'
import { buildUUID } from '@peertube/peertube-node-utils'
import {
MVideo,
MVideoCaption,
MVideoCaptionFormattable,
MVideoCaptionLanguageUrl,
MVideoCaptionVideo
} from '@server/types/models/index.js'
import { remove } from 'fs-extra/esm'
import { join } from 'path'
import { Op, OrderItem, Transaction } from 'sequelize'
Expand All @@ -13,15 +22,6 @@ import {
Table,
UpdatedAt
} from 'sequelize-typescript'
import { ActivityIdentifierObject, VideoCaption } from '@peertube/peertube-models'
import {
MVideo,
MVideoCaption,
MVideoCaptionFormattable,
MVideoCaptionLanguageUrl,
MVideoCaptionVideo
} from '@server/types/models/index.js'
import { buildUUID } from '@peertube/peertube-node-utils'
import { isVideoCaptionLanguageValid } from '../../helpers/custom-validators/video-captions.js'
import { logger } from '../../helpers/logger.js'
import { CONFIG } from '../../initializers/config.js'
Expand Down Expand Up @@ -81,6 +81,10 @@ export class VideoCaptionModel extends SequelizeModel<VideoCaptionModel> {
@Column(DataType.STRING(CONSTRAINTS_FIELDS.COMMONS.URL.max))
fileUrl: string

@AllowNull(false)
@Column
automaticallyGenerated: boolean

@ForeignKey(() => VideoModel)
@Column
videoId: number
Expand Down Expand Up @@ -228,15 +232,17 @@ export class VideoCaptionModel extends SequelizeModel<VideoCaptionModel> {
id: this.language,
label: VideoCaptionModel.getLanguageLabel(this.language)
},
automaticallyGenerated: this.automaticallyGenerated,
captionPath: this.getCaptionStaticPath(),
updatedAt: this.updatedAt.toISOString()
}
}

toActivityPubObject (this: MVideoCaptionLanguageUrl, video: MVideo): ActivityIdentifierObject {
toActivityPubObject (this: MVideoCaptionLanguageUrl, video: MVideo): VideoCaptionObject {
return {
identifier: this.language,
name: VideoCaptionModel.getLanguageLabel(this.language),
automaticallyGenerated: this.automaticallyGenerated,
url: this.getFileUrl(video)
}
}
Expand Down
2 changes: 1 addition & 1 deletion server/core/models/video/video.ts
Original file line number Diff line number Diff line change
Expand Up @@ -1886,7 +1886,7 @@ export class VideoModel extends SequelizeModel<VideoModel> {
if (isArray(videoAP.VideoCaptions)) return videoAP.VideoCaptions

return this.$get('VideoCaptions', {
attributes: [ 'filename', 'language', 'fileUrl' ],
attributes: [ 'filename', 'language', 'fileUrl', 'automaticallyGenerated' ],
transaction
}) as Promise<MVideoCaptionLanguageUrl[]>
}
Expand Down
3 changes: 2 additions & 1 deletion server/core/types/models/video/video-caption.ts
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,8 @@ export type MVideoCaption = Omit<VideoCaptionModel, 'Video'>

export type MVideoCaptionLanguage = Pick<MVideoCaption, 'language'>
export type MVideoCaptionLanguageUrl =
Pick<MVideoCaption, 'language' | 'fileUrl' | 'filename' | 'getFileUrl' | 'getCaptionStaticPath' | 'toActivityPubObject'>
Pick<MVideoCaption, 'language' | 'fileUrl' | 'filename' | 'automaticallyGenerated' | 'getFileUrl' | 'getCaptionStaticPath' |
'toActivityPubObject'>

export type MVideoCaptionVideo =
MVideoCaption &
Expand Down

0 comments on commit 29ccc0c

Please sign in to comment.