diff --git a/.github/workflows/auto-publish.yml b/.github/workflows/auto-publish.yml
new file mode 100644
index 0000000..4ca6ca9
--- /dev/null
+++ b/.github/workflows/auto-publish.yml
@@ -0,0 +1,36 @@
+# Workflow based on the main w3c/spec-prod action example:
+# https://github.com/w3c/spec-prod/#basic-usage
+
+name: Build, Validate, Deploy and Publish
+
+on:
+  # Workflow runs on pull requests where it makes sure that the spec can still be
+  # generated, that markup is valid and that there are no broken links, as
+  # well as on pushes to the default branch where it also deploys the generated
+  # spec to the gh-pages branch and publishes the result to /TR.
+  # The "workflow_dispatch" hook allows admins to also trigger the workflow
+  # manually from GitHub's UI.
+  pull_request: {}
+  push:
+    branches: [main]
+  workflow_dispatch: {}
+
+jobs:
+  main:
+    runs-on: ubuntu-latest
+    steps:
+      # See doc at https://github.com/actions/checkout#usage
+      - name: Checkout repository
+        uses: actions/checkout@v4
+
+      # See doc at https://github.com/w3c/spec-prod/#spec-prod
+      # The action only deploys the generated spec to the gh-pages branch when
+      # the workflow was triggered by a push to the default branch.
+      - name: Build and validate index.html, push to gh-pages branch if needed
+        uses: w3c/spec-prod@v2
+        with:
+          GH_PAGES_BRANCH: gh-pages
+          W3C_ECHIDNA_TOKEN: ${{ secrets.ECHIDNA_TOKEN }}
+          W3C_WG_DECISION_URL: https://github.com/w3c/media-wg/issues/27
+          W3C_BUILD_OVERRIDE: |
+            status: WD
diff --git a/.github/workflows/tidy.yaml b/.github/workflows/tidy.yaml
new file mode 100644
index 0000000..7fb7a22
--- /dev/null
+++ b/.github/workflows/tidy.yaml
@@ -0,0 +1,26 @@
+name: Tidy document
+on:
+  workflow_dispatch: {}
+  # Run when the Bikeshed source changes on the default branch. The gh-pages
+  # branch only receives the generated index.html, which spec-prod pushes with
+  # GITHUB_TOKEN by default, and such pushes do not trigger workflows.
+  push:
+    branches:
+      - main
+    paths:
+      - index.bs
+
+jobs:
+  tidy:
+    name: Tidy up
+    runs-on: macos-latest
+    steps:
+      - uses: actions/checkout@v4
+      # NOTE(review): relies on a Makefile at the repository root — confirm.
+      - run: make
+      # Propose the result as a pull request from the "tidy" branch.
+      - uses: peter-evans/create-pull-request@v6
+        with:
+          title: "Tidied up source"
+          commit-message: "chore(index.bs): tidy up"
+          branch: tidy
diff --git a/.travis.yml b/.travis.yml
deleted file mode 100644
index 7a24eaa..0000000
--- a/.travis.yml
+++ /dev/null
@@ -1,12 +0,0 @@
-language: generic
-
-script: bash ./deploy.sh
-
-branches:
-  only:
-    - master
-
-env:
-  global:
-  - ENCRYPTION_LABEL: 9b5128ce1dd6
-  - COMMIT_AUTHOR_EMAIL: travis-ci@w3.org
diff --git a/README.md b/README.md
index 7cc31ed..f55ecaf 100644
--- a/README.md
+++ b/README.md
@@ -1,4 +1,4 @@
-# Media Session Standard
+# Media Session API
 
 https://w3c.github.io/mediasession/
 
diff --git a/deploy.sh b/deploy.sh
deleted file mode 100644
index 56f8c09..0000000
--- a/deploy.sh
+++ /dev/null
@@ -1,63 +0,0 @@
-#!/bin/bash
-set -e # Exit with nonzero exit code if anything fails
-
-SOURCE_BRANCH="master"
-TARGET_BRANCH="gh-pages"
-
-# Pull requests and commits to other branches shouldn't try to deploy, just build to verify
-if [ "$TRAVIS_PULL_REQUEST" != "false" -o "$TRAVIS_BRANCH" != "$SOURCE_BRANCH" ]; then
-    echo "Skipping deploy; just doing a build."
-    curl https://api.csswg.org/bikeshed/ -f -F file=@index.bs > index.html;
-    exit 0
-fi
-
-# Save some useful information
-REPO=`git config remote.origin.url`
-SSH_REPO=${REPO/https:\/\/github.com\//git@github.com:}
-SHA=`git rev-parse --verify HEAD`
-
-# Clone the existing gh-pages for this repo into out/
-# Create a new empty branch if gh-pages doesn't exist yet (should only happen on first deply)
-git clone $REPO out
-cd out
-git checkout $TARGET_BRANCH || git checkout --orphan $TARGET_BRANCH
-cd ..
-
-# Clean out existing contents
-rm -rf out/* || exit 0
-
-# Re-format.
-
-./format.py index.bs
-
-# Re-generating.
-curl https://api.csswg.org/bikeshed/ -f -F file=@index.bs > out/index.html;
-
-# Now let's go have some fun with the cloned repo
-cd out
-git config user.name "Travis CI"
-git config user.email "$COMMIT_AUTHOR_EMAIL"
-
-# If there are no changes to the compiled out (e.g. this is a README update) then just bail.
-if [[ -z $(git status -s) ]]; then
-    echo "No changes to the output on this push; exiting."
-    exit 0
-fi
-
-# Commit the "changes", i.e. the new version.
-# The delta will show diffs between new and old versions.
-git add .
-git commit -m "Deploy to GitHub Pages: ${SHA}"
-
-# Get the deploy key by using Travis's stored variables to decrypt deploy_key.enc
-ENCRYPTED_KEY_VAR="encrypted_${ENCRYPTION_LABEL}_key"
-ENCRYPTED_IV_VAR="encrypted_${ENCRYPTION_LABEL}_iv"
-ENCRYPTED_KEY=${!ENCRYPTED_KEY_VAR}
-ENCRYPTED_IV=${!ENCRYPTED_IV_VAR}
-openssl aes-256-cbc -K $ENCRYPTED_KEY -iv $ENCRYPTED_IV -in ../deploy_key.enc -out deploy_key -d
-chmod 600 deploy_key
-eval `ssh-agent -s`
-ssh-add deploy_key
-
-# Now that we're all set up, we can push.
-git push $SSH_REPO $TARGET_BRANCH
diff --git a/deploy_key.enc b/deploy_key.enc
deleted file mode 100644
index 4c0b312..0000000
Binary files a/deploy_key.enc and /dev/null differ
diff --git a/explainer.md b/explainer.md
index 142a186..0e37c4a 100644
--- a/explainer.md
+++ b/explainer.md
@@ -106,9 +106,10 @@ interface MediaSession : EventTarget {
 
 ### The `MediaMetadata` interface
 
-A `MediaMetadata` object can contain media metadata like title, artist, album
-and album art. To set the metadata for a `MediaSession`, the page should create
-a `MediaMetadata` object and assign it to a `MediaSession` object:
+A `MediaMetadata` object can contain media metadata like title, artist, album,
+artwork, and video chapter information. To set the metadata for a `MediaSession`,
+the page should create a `MediaMetadata` object and assign it to a `MediaSession`
+object:
 
 ```javascript
 navigator.mediaSession.metadata = new MediaMetadata(/* MediaMetadata constructor */);
@@ -123,6 +124,7 @@ interface MediaMetadata {
     attribute DOMString artist;
     attribute DOMString album;
     attribute FrozenArray<MediaImage> artwork;
+    [SameObject] readonly attribute FrozenArray<ChapterInformation> chapterInfo;
 };
 
 dictionary MediaImage {
@@ -130,6 +132,13 @@ dictionary MediaImage {
   DOMString sizes = "";
   DOMString type = "";
 };
+
+[Exposed=Window]
+interface ChapterInformation {
+  readonly attribute DOMString title;
+  readonly attribute double startTime;
+  [SameObject] readonly attribute FrozenArray<MediaImage> artwork;
+};
 ```
 
 ### The `MediaPositionState` dictionary
diff --git a/format.py b/format.py
index f7051a6..ec7a3a1 100755
--- a/format.py
+++ b/format.py
@@ -36,10 +36,10 @@ def tokenize(source):
 def validate(path, source, tokens):
     stack = []
 
-    def fail(reason, offset):
+    def fail(reason, offset, source=source, path=path):  # defaults keep existing 2-arg calls working
         lineno = source.count('\n', 0, offset) + 1
-        print '%s:%s: error: %s' % (path, lineno, reason)
-        print source.splitlines()[lineno - 1]
+        print(f'{path}:{lineno}: error: {reason}')
+        print(source.splitlines()[lineno - 1])
         sys.exit(1)
 
     for token, start, end, name in tokens:
diff --git a/index.bs b/index.bs
index 6c7f034..d576178 100644
--- a/index.bs
+++ b/index.bs
@@ -1,15 +1,19 @@
 <pre class="metadata">
-Title: Media Session Standard
+Title: Media Session
 Repository: w3c/mediasession
 Status: ED
-ED: https://w3c.github.io/mediasession
+ED: https://w3c.github.io/mediasession/
+TR: https://www.w3.org/TR/mediasession/
 Shortname: mediasession
-Level: 1
-Editor: Mounir Lamouri, w3cid 45389, Google Inc., mlamouri@google.com
-Editor: Becca Hughes, w3cid 103353, Google Inc., beccahughes@google.com
+Level: None
+Editor: Tommy Steimel, w3cid 135774, Google Inc., steimel@google.com
+Editor: Youenn Fablet, w3cid 96458, Apple Inc., youenn@apple.com
+Former Editor: Mounir Lamouri, w3cid 45389, Google Inc., mlamouri@google.com
+Former Editor: Becca Hughes, w3cid 103353, Google Inc., beccahughes@google.com
 Former Editor: Zhiqiang Zhang, Google Inc., zqzhang@google.com
 Former Editor: Rich Tibbett, Opera, richt@opera.com
 
+Markup Shorthands: markdown yes
 Group: mediawg
 Logo: https://resources.whatwg.org/logo-mediasession.svg
 Abstract: This specification enables web developers to show customized media
@@ -17,12 +21,8 @@ Abstract: metadata on platform UI, customize available platform media
 Abstract: controls, and access platform media keys such as hardware keys found
 Abstract: on keyboards, headsets, remote controls, and software keys found in
 Abstract: notification areas and on lock screens of mobile devices.
-!Participate: <a href="https://github.com/w3c/mediasession/">We are on GitHub</a>
-!Participate: <a href="https://github.com/w3c/mediasession/issues/new">File an issue</a>
-!Participate: <a href="https://github.com/w3c/mediasession/issues?state=open">Open issues</a>
 !Version History: <a href="https://github.com/w3c/mediasession/commits">https://github.com/w3c/mediasession/commits</a>
 Ignored Vars: context, media, session
-Boilerplate: omit conformance, omit feedback-header
 </pre>
 
 <style>
@@ -48,67 +48,17 @@ table td, table th {
 }
 </style>
 
+<pre class="link-defaults">
+spec:html; type:element; text:link
+</pre>
+
 <pre class="anchors">
 urlPrefix: https://html.spec.whatwg.org/multipage/; spec: HTML
     type: dfn
-        urlPrefix: infrastructure.html
-            text: case-sensitive; url: #case-sensitivity-and-string-comparison
-            text: ASCII case-insensitive; url: #ascii-case-insensitive
-            text: in parallel
-            text: unordered set of unique space-separated tokens; url: #unordered-set-of-unique-space-separated-tokens
-            text: document base url
-            text: MIME type
-        urlPrefix: embedded-content.html
-            text: media element
-            text: muted; url: #concept-media-muted
-            text: pause event; url: #event-media-pause
-            text: play event; url: #event-media-play
-            text: potentially playing
-        urlPrefix: browsers.html
-            text: browsing context
-            text: top-level browsing context
-            text: nested browsing context
         urlPrefix: webappapis.html
-            text: API base URL
             text: entry settings object
-            text: queue a task
-            text: task
-            text: task source
-        urlPrefix: semantics.html
-            text: link; for: HTMLLinkElement; url:#the-link-element
         urlPrefix: interaction.html
-            text: triggered by user activation
-    type: attribute
-        urlPrefix: semantics.html
-            text: sizes; for: HTMLLinkElement; url: #attr-link-sizes;
-urlPrefix: https://url.spec.whatwg.org/; spec: URL
-    type: dfn; urlPrefix: #concept-
-        text: url parser
-    type: dfn
-        text: absolute URL; url: #syntax-url-absolute
-        text: relative URL; url: #syntax-url-relative
-urlPrefix: https://fetch.spec.whatwg.org/; spec: FETCH
-    type: dfn; urlPrefix: #concept-
-        text: fetch
-        text: request
-        text: context; url: request-context
-        text: context frame type; url: request-context-frame-type
-        text: internal response
-        text: origin; url: request-origin
-        text: referrer; url: request-referrer
-        text: response
-        text: response type
-        text: url; url: request-url
-    type: dfn;
-        text: force Origin header flag
-urlPrefix: https://www.w3.org/TR/appmanifest/; spec: appmanifest
-    type: dfn
-        text: image object; url: #dfn-image-object
-urlPrefix: https://heycam.github.io/webidl/
-    type: exception
-        text: TypeError
-urlPrefix: https://tc39.github.io/ecma262/#sec-object.; type: dfn
-    text: freeze
+            text: activation notification
 </pre>
 
 <h2 id="introduction">Introduction</h2>
@@ -117,49 +67,11 @@ urlPrefix: https://tc39.github.io/ecma262/#sec-object.; type: dfn
 
 Media is used extensively today, and the Web is one of the primary means of
 consuming media content. Many platforms can display media metadata, such as
-title, artist, album and album art on various UI elements such as notification,
-media control center, device lockscreen and wearable devices. This specification
-aims to enable web pages to specify the media metadata to be displayed in
-platform UI, and respond to media controls which may come from platform UI or
-media keys, thereby improving the user experience.
-
-<h2 id="conformance">Conformance</h2>
-
-All diagrams, examples, and notes in this specification are non-normative, as
-are all sections explicitly marked non-normative. Everything else in this
-specification is normative.
-
-The key words "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT", "SHOULD",
-"SHOULD NOT", "RECOMMENDED", "NOT RECOMMENDED", "MAY", and "OPTIONAL" in this
-document are to be interpreted as described in RFC 2119. For readability, these
-words do not appear in all uppercase letters in this specification. [[!RFC2119]]
-
-Requirements phrased in the imperative as part of algorithms (such as "strip any
-leading space characters" or "return false and terminate these steps") are to be
-interpreted with the meaning of the key word ("must", "should", "may", etc) used
-in introducing the algorithm.
-
-Conformance requirements phrased as algorithms or specific steps may be
-implemented in any manner, so long as the end result is equivalent. (In
-particular, the algorithms defined in this specification are intended to be easy
-to follow, and not intended to be performant.)
-
-User agents may impose implementation-specific limits on otherwise unconstrained
-inputs, e.g. to prevent denial of service attacks, to guard against running out
-of memory, or to work around platform-specific limitations.
-
-When a method or an attribute is said to call another method or attribute, the
-user agent must invoke its internal API for that attribute or method so that
-e.g. the author can't change the behavior by overriding attributes or methods
-with custom properties or functions in JavaScript.
-
-Unless otherwise stated, string comparisons are done in a <a>case-sensitive</a>
-manner.
-
-<h2 id="dependencies">Dependencies</h2>
-
-The IDL fragments in this specification must be interpreted as required for
-conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
+title, artist, album and album art on various UI elements such as notifications,
+media control center, device lockscreen, and wearable devices. This
+specification aims to enable web pages to specify the media metadata to be
+displayed in platform UI, and respond to media controls that may come from
+platform UI or media keys, thereby improving the user experience.
 
 <section>
   <h2 id='security-privacy-considerations'>Security and Privacy
@@ -245,37 +157,36 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
     <h3 id='playback-state-model'>Playback State</h3>
 
     <p>
-      In order to make <a enum-value for="MediaSessionAction">play</a> and
-      <a enum-value for="MediaSessionAction">pause</a> actions work properly,
-      the user agent SHOULD be able to determine if a <a>browsing context</a> of
-      the <a>active media session</a> is playing media or not, which is called
-      the <dfn>guessed playback state</dfn>. The RECOMMENDED way for determining
-      the <a>guessed playback state</a> is to monitor the media elements whose
-      node document's browsing context is the <a>browsing context</a>. The
-      <a>browsing context</a>'s <a>guessed playback state</a> is <a enum-value
-      for="MediaSessionPlaybackState">playing</a> if any of them is
-      <a>potentially playing</a> and not <a>muted</a>, and is <a enum-value
-      for="MediaSessionPlaybackState">paused</a> otherwise. Other information
-      SHOULD also be considered, such as WebAudio and plugins.
+      In order to make {{MediaSessionAction/play}} and
+      {{MediaSessionAction/pause}} actions work properly, the user agent SHOULD
+      be able to determine if a [=/browsing context=] of the <a>active media
+      session</a> is playing media or not, which is called the <dfn>guessed
+      playback state</dfn>. The RECOMMENDED way for determining the <a>guessed
+      playback state</a> is to monitor the media elements whose node document's
+      [=Document/browsing context=] is the [=/browsing context=]. The
+      [=/browsing context=]'s <a>guessed playback state</a> is
+      {{MediaSessionPlaybackState/"playing"}} if any of them is
+      [=media element/potentially playing=] and not [=media element/muted=],
+      and is {{MediaSessionPlaybackState/"paused"}} otherwise. Other
+      information SHOULD also be considered, such as WebAudio and plugins.
     </p>
 
     <p>
-      The <a attribute for="MediaSession">playbackState</a> attribute specifies
-      the <a>declared playback state</a> from the <a>browsing context</a>. The
-      state is combined with the <a>guessed playback state</a> to compute the
+      The {{MediaSession/playbackState}} attribute specifies the <a>declared
+      playback state</a> from the [=/browsing context=]. The state is combined
+      with the <a>guessed playback state</a> to compute the
       <dfn>actual playback state</dfn>, which is a finalized state and will be
-      used for
-      <a enum-value for="MediaSessionAction">play</a> and
-      <a enum-value for="MediaSessionAction">pause</a> actions.
+      used for {{MediaSessionAction/play}} and {{MediaSessionAction/pause}}
+      actions.
     </p>
 
     <p>
       The <a>actual playback state</a> is computed in the following way:
       <ul>
         <li>
-          If the <a>declared playback state</a> is <a enum-value
-          for="MediaSessionPlaybackState">playing</a>, return <a enum-value
-          for="MediaSessionPlaybackState">playing</a>.
+          If the <a>declared playback state</a> is
+          {{MediaSessionPlaybackState/playing}}, return
+          {{MediaSessionPlaybackState/playing}}.
         </li>
         <li>
           Otherwise, return the <a>guessed playback state</a>.
@@ -286,9 +197,9 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
     <p class=note>
       The {{MediaSession/playbackState}} attribute could be useful when the page
       wants to do some preparation steps when the media is paused but it allows
-      the preparation steps to be interrupted by <a enum-value
-      for="MediaSessionAction">pause</a> action. See <a
-      href="#example-set-playbackState">Setting playbackState</a> for example.
+      the preparation steps to be interrupted by {{MediaSessionAction/pause}}
+      action. See <a href="#example-set-playbackState">Setting playbackState</a>
+      for example.
     </p>
 
     <p>
@@ -304,7 +215,7 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
     There could be multiple {{MediaSession}} objects existing at the same time
     since the user agent could have multiple tabs, each tab could contain a
     <a>top-level browsing context</a> and multiple <a>nested browsing
-    contexts</a>, and each <a>browsing context</a> could have a {{MediaSession}}
+    contexts</a>, and each [=/browsing context=] could have a {{MediaSession}}
     object.
 
     The user agent MUST select at most one of the {{MediaSession}} objects to
@@ -315,10 +226,10 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
     routing. It only takes effect for the <a>active media session</a>.
 
     It is RECOMMENDED that the user agent selects the <a>active media
-    session</a> by managing <a>audio focus</a>. A tab or <a>browsing context</a>
-    is said to have <dfn>audio focus</dfn> if it is currently playing audio or
-    the user expects to control the media in it. The AudioFocus API targets this
-    area and could be used once it's finished.
+    session</a> by managing <a>audio focus</a>. A tab or [=Window/browsing
+    context=] is said to have <dfn>audio focus</dfn> if it is currently playing
+    audio or the user expects to control the media in it. The AudioFocus API
+    targets this area and could be used once it's finished.
 
     Whenever the <a>active media session</a> is changed, the user agent MUST run
     the <a>media session actions update algorithm</a> and the <a>update metadata
@@ -330,10 +241,9 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
 
     The media metadata for the <a>active media session</a> MAY be displayed in
     the platform UI depending on platform conventions. Whenever the <a>active
-    media session</a> changes or setting <a attribute
-    for="MediaSession"><code>metadata</code></a> of the <a>active media
-    session</a>, the user agent MUST run the <dfn>update metadata
-    algorithm</dfn>. The steps are as follows:
+    media session</a> changes or setting {{MediaSession/metadata}} of the
+    <a>active media session</a>, the user agent MUST run the <dfn>update
+    metadata algorithm</dfn>. The steps are as follows:
 
     <ol>
       <li>
@@ -341,17 +251,17 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
         presented to the platform, and terminate these steps.
       </li>
       <li>
-        If the <a attribute for="MediaSession"><code>metadata</code></a> of the
+        If the {{MediaSession/metadata}} of the
         <a>active media session</a> is an <a>empty metadata</a>, unset the media
         metadata presented to the platform, and terminate these steps.
       </li>
       <li>
-        Update the media metadata presented to the platform to match the <a
-        attribute for="MediaSession"><code>metadata</code></a> for the
+        Update the media metadata presented to the platform to match the
+        {{MediaSession/metadata}} for the
         <a>active media session</a>.
       </li>
       <li>
-        If the user agent wants to display an <a>artwork image</a>, it is
+        If the user agent wants to display an [=MediaMetadata/artwork image=], it is
         RECOMMENDED to run the <a>fetch image algorithm</a>.
       </li>
     </ol>
@@ -365,30 +275,27 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
         existing algorithm execution instances.
       </li>
       <li>
-        If <var>metadata</var>'s <a attribute
-        for="MediaMetadata"><code>artwork</code></a> of the <a>active media
-        session</a> is empty, then terminate these steps.
+        If <var>metadata</var>'s {{MediaMetadata/artwork}} of the <a>active
+        media session</a> is empty, then terminate these steps.
       </li>
       <li>
         If the platform supports displaying media artwork, select a
-        <dfn>preferred artwork image</dfn> from <var>metadata</var>'s <a
-        attribute for="MediaMetadata"><code>artwork</code></a> of the <a>active
-        media session</a>.
+        <dfn>preferred artwork image</dfn> from <var>metadata</var>'s
+        {{MediaMetadata/artwork}} of the <a>active media session</a>.
       </li>
       <li>
-        <a title="fetch">Fetch</a> the <a>preferred artwork image</a>'s
-        {{MediaImage/src}}.
+        [=Fetch=] the <a>preferred artwork image</a>'s {{MediaImage/src}}.
 
         Then, <a>in parallel</a>:
 
         <ol>
           <li>
-            Wait for the <a>response</a>.
+            Wait for the [=/response=].
           </li>
           <li>
-            If the <a>response</a>'s <a>internal response</a>'s <a lt="response
-            type">type</a> is <i>default</i>, attempt to decode the resource as
-            an image.
+            If the [=/response=]'s [=response/type=] is
+            {{ResponseType/"default"}}, attempt to decode the resource as an
+            image.
           </li>
           <li>
             If the image format is supported, use the image as the artwork for
@@ -414,10 +321,19 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
     </p>
 
     <p>
-      A <dfn title='media session action source'>media session action
-      source</dfn> is a source that might produce a <a>media session action</a>.
-      Such a source can be the platform or the UI surfaces created by the user
-      agent.
+      A <dfn>media session action source</dfn> is a source that might produce a
+      <a>media session action</a>. Such a source can be the platform or the UI
+      surfaces created by the user agent.
+    </p>
+    <p>
+      A <a>media session action source</a> has an optional
+      <dfn for="media session action source">target</dfn> which should be the
+      recipient of any <a>media session action</a> created by the
+      <a>media session action source</a>. If a <a>media session action
+      source</a>'s
+      <a for="media session action source">target</a> is `null`, the <a>active
+      media session</a> is the recipient of all of that
+      <a>media session action source</a>'s actions.
     </p>
 
     <p>
@@ -425,45 +341,72 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
       which can have one of the following value:
       <ul>
         <li>
-          <dfn enum-value for=MediaSessionAction>play</dfn>: the action intent
+          <dfn enum-value for=MediaSessionAction>play</dfn>: the action's intent
           is to resume the playback.
         </li>
         <li>
-          <dfn enum-value for=MediaSessionAction>pause</dfn>: the action intent
-          is to pause the currently active playback.
+          <dfn enum-value for=MediaSessionAction>pause</dfn>: the action's
+          intent is to pause the currently active playback.
         </li>
         <li>
-          <dfn enum-value for=MediaSessionAction>seekbackward</dfn>: the action
-          intent is to move the playback time backward by a short period (eg. a
-          few seconds).
+          <dfn enum-value for=MediaSessionAction>seekbackward</dfn>: the
+          action's intent is to move the playback time backward by a short
+          period (eg. a few seconds).
         </li>
         <li>
-          <dfn enum-value for=MediaSessionAction>seekforward</dfn>: the action
+          <dfn enum-value for=MediaSessionAction>seekforward</dfn>: the action's
           intent is to move the playback time forward by a short period (eg. a
           few seconds).
         </li>
         <li>
-          <dfn enum-value for=MediaSessionAction>previoustrack</dfn>: the action
-          intent is to either start the current playback from the beginning if
-          the playback has a notion of beginning, or move to the previous item
-          in the playlist if the playback has a notion of playlist.
+          <dfn enum-value for=MediaSessionAction>previoustrack</dfn>: the
+          action's intent is to either start the current playback from the
+          beginning if the playback has a notion of beginning, or move to the
+          previous item in the playlist if the playback has a notion of
+          playlist.
         </li>
         <li>
-          <dfn enum-value for=MediaSessionAction>nexttrack</dfn>: the action is
-          to move to the playback to the next item in the playlist if the
-          playback has a notion of playlist.
+          <dfn enum-value for=MediaSessionAction>nexttrack</dfn>: the action's
+          intent is to move the playback to the next item in the playlist if
+          the playback has a notion of playlist.
         </li>
         <li>
-          <dfn enum-value for=MediaSessionAction>skipad</dfn>: the action intent
-          is to skip the advertisement that is currently playing.
+          <dfn enum-value for=MediaSessionAction>skipad</dfn>: the action's
+          intent is to skip the advertisement that is currently playing.
         </li>
         <li>
-          <dfn enum-value for=MediaSessionAction>stop</dfn>: the action intent
+          <dfn enum-value for=MediaSessionAction>stop</dfn>: the action's intent
           is to stop the playback and clear the state if appropriate.
         </li>
         <li>
-          <dfn enum-value for=MediaSessionAction>seekto</dfn>: the action intent
-          is to move the playback time to a specific time.
+          <dfn enum-value for=MediaSessionAction>seekto</dfn>: the action's
+          intent is to move the playback time to a specific time.
+        </li>
+        <li>
+          <dfn enum-value for=MediaSessionAction>togglemicrophone</dfn>: the
+          action's intent is to mute or unmute the user's microphone.
+        </li>
+        <li>
+          <dfn enum-value for=MediaSessionAction>togglecamera</dfn>: the
+          action's intent is to turn the user's active camera on or off.
+        </li>
+        <li>
+          <dfn enum-value for=MediaSessionAction>hangup</dfn>: the action's
+          intent is to end a call.
+        </li>
+        <li>
+          <dfn enum-value for=MediaSessionAction>previousslide</dfn>: the
+          action's intent is to go back to the previous slide when presenting
+          slides.
+        </li>
+        <li>
+          <dfn enum-value for=MediaSessionAction>nextslide</dfn>: the action's
+          intent is to go to the next slide when presenting slides.
+        </li>
+        <li>
+          <dfn enum-value for=MediaSessionAction>enterpictureinpicture</dfn>:
+          the action's intent is to open the media session in a
+          picture-in-picture window.
         </li>
       </ul>
     </p>
@@ -480,7 +423,7 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
       is invoked, the user agent MUST run the following steps:
       <ol>
         <li>
-          If <var>handler</var> is <code>null</code>, remove <var>action</var>
+          If <var>handler</var> is `null`, remove <var>action</var>
           from the <a>supported media session actions</a> for {{MediaSession}}
           and abort these steps.
         </li>
@@ -501,17 +444,25 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
 
     <p>
       When the user agent is notified by a <a>media session action source</a>
-      that a
+      named <var>source</var> that a
       <a>media session action</a> named <var>action</var> has been triggered,
-      the user agent MUST run the <dfn>handle media session action</dfn> steps
-      as follows and consider it <a>triggered by user activation</a>:
+      the user agent MUST <a>queue a task</a>, using the [=user interaction task
+      source=], to run the following
+      <dfn>handle media session action</dfn> steps:
       <ol>
         <li>
-          If the <a>active media session</a> is <code>null</code>, abort these
-          steps.
+          Let <var>session</var> be <var>source</var>'s <a for="media session
+          action source">target</a>.
+        </li>
+        <li>
+          If <var>session</var> is `null`, set <var>session</var> to the
+          <a>active media session</a>.
         </li>
         <li>
-          Let <var>actions</var> be the <a>active media session</a>'s
+          If <var>session</var> is `null`, abort these steps.
+        </li>
+        <li>
+          Let <var>actions</var> be <var>session</var>'s
           <a>supported media session actions</a>.
         </li>
         <li>
@@ -524,20 +475,11 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
         </li>
         <li>
           Run <var>handler</var> with the <var>details</var> parameter set to:
-          <ul>
-            <li>
-              {{MediaSessionSeekActionDetails}} if <var>action</var> is
-              <a enum-value for=MediaSessionAction>seekbackward</a> or
-              <a enum-value for=MediaSessionAction>seekforward</a>.
-            </li>
-            <li>
-              {{MediaSessionSeekToActionDetails}} if <var>action</var> is
-              <a enum-value for=MediaSessionAction>seekto</a>.
-            </li>
-            <li>
-              Otherwise, with {{MediaSessionActionDetails}}.
-            </li>
-          </ul>
+          {{MediaSessionActionDetails}}.
+        </li>
+        <li>
+          Run the <a>activation notification</a> steps in the [=/browsing
+          context=] associated with <var>session</var>.
         </li>
       </ol>
     </p>
@@ -546,11 +488,11 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
       When the user agent receives a joint command for <a enum-value
       for=MediaSessionAction>play</a> and <a enum-value
       for=MediaSessionAction>pause</a>, such as a headset button click, it MUST
-      run the following steps:
+      <a>queue a task</a>, using the [=user interaction task source=], to run
+      the following steps:
       <ol>
         <li>
-          If the <a>active media session</a> is <code>null</code>, abort these
-          steps.
+          If the <a>active media session</a> is `null`, abort these steps.
         </li>
         <li>
           Let <var>action</var> be a <a>media session action</a>.
@@ -578,6 +520,23 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
       provided for the <a>active media session</a>.
     </p>
 
+    <p>
+      A user agent MAY implement a default handler for the <a enum-value
+      for=MediaSessionAction>togglemicrophone</a>, <a enum-value
+      for=MediaSessionAction>togglecamera</a>, or <a enum-value
+      for=MediaSessionAction>hangup</a> <a>media session actions</a> if none was
+      provided for the <a>active media session</a>.
+    </p>
+    <p>
+      A user agent MAY expose microphone and camera state to web pages via
+      {{MediaStreamTrack}}'s {{MediaStreamTrack/muted}} attribute in addition
+      to the {{MediaSessionAction/togglemicrophone}} or
+      {{MediaSessionAction/togglecamera}} [=media session actions=]. In that
+      case, the user agent MUST execute the corresponding
+      {{MediaSessionActionHandler}} before running, as different tasks, the
+      steps defined to [$set a track's muted state$].
+    </p>
+
     <p class=note>
       A page should only register a {{MediaSessionActionHandler}} for a <a>media
       session action</a> when it can handle the action given that the user agent
@@ -640,7 +599,7 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
   </section>
 
   <section>
-    <h3 id='position-state'>Position State</h3>
+    <h3 id='position-state-sec'>Position State</h3>
 
     <p>
       A user agent MAY display the <a>current playback position</a> and
@@ -673,7 +632,7 @@ conforming IDL fragments, as described in the Web IDL specification. [[!WEBIDL]]
     <p>
       The RECOMMENDED way to determine the <a>position state</a> is to monitor
       the media elements whose node document's browsing context is the
-      <a>browsing context</a>.
+      [=/browsing context=].
     </p>
 
     <p>
@@ -745,10 +704,16 @@ enum MediaSessionAction {
   "nexttrack",
   "skipad",
   "stop",
-  "seekto"
+  "seekto",
+  "togglemicrophone",
+  "togglecamera",
+  "hangup",
+  "previousslide",
+  "nextslide",
+  "enterpictureinpicture"
 };
 
-callback MediaSessionActionHandler = void(MediaSessionActionDetails details);
+callback MediaSessionActionHandler = undefined(MediaSessionActionDetails details);
 
 [Exposed=Window]
 interface MediaSession {
@@ -756,9 +721,13 @@ interface MediaSession {
 
   attribute MediaSessionPlaybackState playbackState;
 
-  void setActionHandler(MediaSessionAction action, MediaSessionActionHandler? handler);
+  undefined setActionHandler(MediaSessionAction action, MediaSessionActionHandler? handler);
+
+  undefined setPositionState(optional MediaPositionState state = {});
 
-  void setPositionState(optional MediaPositionState? state);
+  Promise&lt;undefined&gt; setMicrophoneActive(boolean active);
+
+  Promise&lt;undefined&gt; setCameraActive(boolean active);
 };
 </pre>
 
@@ -770,7 +739,7 @@ interface MediaSession {
 
 <p>
   A {{MediaSession}} has an associated <dfn for="MediaSession">metadata</dfn>
-  object represented by a {{MediaMetadata}}. It is initially <code>null</code>.
+  object represented by a {{MediaMetadata}}. It is initially `null`.
 </p>
 
 <p>
@@ -781,24 +750,21 @@ interface MediaSession {
 
 <p>
   The <dfn attribute for="MediaSession"><code>metadata</code></dfn> attribute
-  reflects the {{MediaSession}}'s <a for=MediaSession>metadata</a>. On getting,
-  it MUST return the {{MediaSession}}'s <a for=MediaSession>metadata</a>. On
-  setting, it MUST run the following steps with <var>value</var> being the new
-  value being set:
+  reflects the {{MediaSession}}'s {{MediaSession/metadata}}. On getting, it MUST
+  return the {{MediaSession}}'s {{MediaSession/metadata}}. On setting, it MUST
+  run the following steps with <var>value</var> being the new value being set:
   <ol>
     <li>
-      If the {{MediaSession}}'s <a for=MediaSession>metadata</a> is not
-      <code>null</code>, set its <a for=MediaMetadata>media session</a> to
-      <code>null</code>.
+      If the {{MediaSession}}'s {{MediaSession/metadata}} is not `null`, set its
+      [=MediaMetadata/media session=] to `null`.
     </li>
     <li>
-      Set the {{MediaSession}}'s <a for=MediaSession>metadata</a> to
+      Set the {{MediaSession}}'s {{MediaSession/metadata}} to
       <var>value</var>.
     </li>
     <li>
-      If the {{MediaSession}}'s <a for=MediaSession>metadata</a> is not
-      <code>null</code>, set its <a for=MediaMetadata>media session</a> to the
-      current {{MediaSession}}.
+      If the {{MediaSession}}'s {{MediaSession/metadata}} is not `null`, set its
+      [=MediaMetadata/media session=] to the current {{MediaSession}}.
     </li>
     <li>
       <a>In parallel</a>, run the <a>update metadata algorithm</a>.
@@ -809,14 +775,14 @@ interface MediaSession {
 <p>
   The <dfn attribute for="MediaSession"><code>playbackState</code></dfn>
   attribute represents the <dfn>declared playback state</dfn> of the <a>media
-  session</a>, by which the session declares whether its <a>browsing context</a>
+  session</a>, by which the session declares whether its [=/browsing context=]
   is playing media or not. The initial value is <a enum-value
   for="MediaSessionPlaybackState">none</a>. On setting, the user agent MUST set
   the IDL attribute to the new value if it is a valid
   {{MediaSessionPlaybackState}} value. On getting, the user agent MUST return
   the last valid value that was set. The {{MediaSession/playbackState}}
-  attribute is a hint for the user agent to determine whether the <a>browsing
-  context</a> is playing or paused.
+  attribute is a hint for the user agent to determine whether the [=/browsing
+  context=] is playing or paused.
 </p>
 
 <p class=note>
@@ -826,66 +792,67 @@ interface MediaSession {
 
 <p>
   The {{MediaSessionPlaybackState}} enum is used to indicate whether a
-  <a>browsing context</a> is playing media or not, the values are described as
+  [=/browsing context=] is playing media or not, the values are described as
   follows:
 
   <ul>
     <li>
       <dfn enum-value for="MediaSessionPlaybackState">none</dfn> means the
-      <a>browsing context</a>
-      does not specify whether it's playing or paused, it can only be used in
-      the {{MediaSession/playbackState}} attribute.
+      [=/browsing context=] does not specify whether it's playing or paused, it
+      can only be used in the {{MediaSession/playbackState}} attribute.
     </li>
     <li>
       <dfn enum-value for="MediaSessionPlaybackState">playing</dfn> means the
-      <a>browsing context</a> is currently playing media and it can be paused.
+      [=/browsing context=] is currently playing media and it can be paused.
     </li>
     <li>
       <dfn enum-value for="MediaSessionPlaybackState">paused</dfn> means the
-      <a>browsing context</a> has paused media and it can be resumed.
+      [=/browsing context=] has paused media and it can be resumed.
     </li>
   </ul>
 </p>
 
 <p>
-  The <dfn method for=MediaSession>setActionHandler()</dfn> method, when
-  invoked, MUST run the <a>update action handler algorithm</a> with
+  The <dfn method for=MediaSession>setActionHandler(action, handler)</dfn>
+  method, when invoked, MUST run the <a>update action handler algorithm</a> with
   <var>action</var> and <var>handler</var> on the {{MediaSession}}.
 </p>
 
 <p>
-  The <dfn method for=MediaSession>setPositionState()</dfn> method, when invoked
-  MUST perform the following steps:
+  The <dfn method for=MediaSession>setPositionState(|state|)</dfn> method, when
+  invoked, MUST perform the following steps:
 
   <ul>
     <li>
-      If the <var>state</var> is a null or an empty dictionary then clear the
-      <a>position state</a>.
+      If <var>state</var> is an empty dictionary, clear the <a>position
+      state</a>
+      and abort these steps.
     </li>
     <li>
-      If the <a dict-member for="MediaPositionState">duration</a> is not present
-      or its value is null, throw a <a exception>TypeError</a>.
+      If <var>state</var>'s <a dict-member for="MediaPositionState">duration</a>
+      is not present, throw a <a exception>TypeError</a>.
     </li>
     <li>
-      If the <a dict-member for="MediaPositionState">duration</a> is negative,
-      throw a <a exception>TypeError</a>.
+      If <var>state</var>'s {{MediaPositionState/duration}} is negative or
+      <code>NaN</code>, throw a <a exception>TypeError</a>.
     </li>
     <li>
-      If the <a dict-member for="MediaPositionState">position</a> is not present
-      or its value is null, set it to zero.
+      If <var>state</var>'s {{MediaPositionState/position}} is not present, set
+      it to zero.
     </li>
     <li>
-      If the <a dict-member for="MediaPositionState">position</a> is negative or
-      greater than <a dict-member for="MediaPositionState">duration</a>, throw a
+      If <var>state</var>'s <a dict-member for="MediaPositionState">position</a>
+      is negative or greater than <a dict-member
+      for="MediaPositionState">duration</a>, throw a
       <a exception>TypeError</a>.
     </li>
     <li>
-      If the <a dict-member for="MediaPositionState">playbackRate</a> is not
-      present or its value is null, set it to 1.0.
+      If <var>state</var>'s <a dict-member
+      for="MediaPositionState">playbackRate</a> is not present, set it to 1.0.
     </li>
     <li>
-      If the <a dict-member for="MediaPositionState">playbackRate</a> is zero
-      throw a <a exception>TypeError</a>.
+      If <var>state</var>'s {{MediaPositionState/playbackRate}} is zero, throw a
+      <a exception>TypeError</a>.
     </li>
     <li>
       Update the <a>position state</a> and <a>last position updated time</a>.
@@ -893,6 +860,139 @@ interface MediaSession {
   </ul>
 </p>
 
+<p>
+  The <dfn method for=MediaSession>setMicrophoneActive(active)</dfn> method
+  indicates to the user agent the microphone capture state desired by the page
+  (e.g. if the microphone is considered "inactive" by the page since it is no
+  longer sending audio through a call, the page can invoke
+  <code>setMicrophoneActive(false)</code>). When invoked, it MUST perform the
+  following steps:
+  <ol>
+    <li>
+      Let <var>document</var> be [=this=]'s [=relevant global object=]'s
+      [=associated Document=].
+    </li>
+    <li>
+      Let <var>captureKind</var> be "microphone".
+    </li>
+    <li>
+      Return the result of running the [=update capture state algorithm=] with
+      <var>document</var>, <var>active</var> and <var>captureKind</var>.
+    </li>
+  </ol>
+</p>
+<p>
+  Similarly, the <dfn method for=MediaSession>setCameraActive(active)</dfn>
+  method indicates to the user agent the camera capture state desired by the
+  page. When invoked, it MUST perform the following steps:
+  <ol>
+    <li>
+      Let <var>document</var> be [=this=]'s [=relevant global object=]'s
+      [=associated Document=].
+    </li>
+    <li>
+      Let <var>captureKind</var> be "camera".
+    </li>
+    <li>
+      Return the result of running the [=update capture state algorithm=] with
+      <var>document</var>, <var>active</var> and <var>captureKind</var>.
+    </li>
+  </ol>
+</p>
+<p>
+  The <dfn>update capture state algorithm</dfn>, when invoked with
+  <var>document</var>, <var>active</var> and <var>captureKind</var>, MUST
+  perform the following steps:
+  <ol>
+    <li>
+      If <var>document</var> is not [=fully active=], return [=a promise
+      rejected with=] <a exception>InvalidStateError</a>.
+    </li>
+    <li>
+      If <var>active</var> is <code>true</code> and <var>document</var>'s
+      [=Document/visibility state=] is not "visible", the user agent MAY return
+      [=a promise rejected with=] <a exception>InvalidStateError</a>.
+    </li>
+    <li>
+      Let <var>p</var> be a new promise.
+    </li>
+    <li>
+      <a>In parallel</a>, run the following steps:
+      <ol>
+        <li>
+          Let <var>applyPausePolicy</var> be <code>true</code> if the user agent
+          implements a policy of <dfn>pausing all input sources</dfn> of type
+          <var>captureKind</var> in response to UI and <code>false</code>
+          otherwise.
+        </li>
+        <li>
+          If <var>applyPausePolicy</var> is <code>true</code>, run the following
+          substeps:
+          <ol>
+            <li>
+              Let <var>currentlyActive</var> be <code>false</code> if the user
+              agent is currently [=pausing all input sources=] of type
+              <var>captureKind</var>
+              and <code>true</code> otherwise.
+            </li>
+            <li>
+              If <var>active</var> is <var>currentlyActive</var>, resolve
+              <var>p</var> with <code>undefined</code> and abort these steps.
+            </li>
+            <li>
+              If <var>active</var> is <code>true</code>, the user agent MAY wait
+              to proceed, for instance to prompt the user.
+            </li>
+            <li>
+              If the user agent denies the request to update the capture state,
+              reject <var>p</var> with a <a exception>NotAllowedError</a> and
+              abort these steps.
+            </li>
+          </ol>
+        </li>
+        <li>
+          Update the user agent capture state UI according to
+          <var>captureKind</var>
+          and <var>active</var>.
+        </li>
+        <li>Resolve <var>p</var> with <code>undefined</code>.</li>
+        <li>
+          If <var>applyPausePolicy</var> is <code>true</code>, run the following
+          substeps:
+          <ol>
+            <li>
+              Let <var>newMutedState</var> be <code>true</code> if
+              <var>active</var> is
+            <code>false</code> and <code>false</code> otherwise.</li>
+            <li>
+              For each {{MediaStreamTrack}} whose source is of type
+              <var>captureKind</var>,
+              <a>queue a task</a> to [$set a track's muted state$] to
+              <var>newMutedState</var>.
+            </li>
+          </ol>
+        </li>
+      </ol>
+    </li>
+    <li>
+      Return <var>p</var>.
+    </li>
+  </ol>
+</p>
+<p class=note>
+  Both the {{MediaSession/setMicrophoneActive(active)}} and
+  {{MediaSession/setCameraActive(active)}} methods can reject based on user
+  agent specific heuristics. This might in particular happen when the web page
+  asks to activate (aka unmute) the microphone or camera. The user agent could
+  decide to require [=transient activation=] in that case. It might also
+  require user input through a prompt to make the actual decision.
+</p>
+
+<p>
+  The user agent MAY display UI which invokes handlers for
+  <a>media session actions</a>.
+</p>
+
 <h2 id="the-mediametadata-interface">The {{MediaMetadata}} interface</h2>
 
 <pre class="idl">
@@ -903,7 +1003,8 @@ interface MediaMetadata {
   attribute DOMString title;
   attribute DOMString artist;
   attribute DOMString album;
-  attribute FrozenArray&lt;object> artwork;
+  attribute FrozenArray&lt;MediaImage> artwork;
+  [SameObject] readonly attribute FrozenArray&lt;ChapterInformation> chapterInfo;
 };
 
 dictionary MediaMetadataInit {
@@ -911,6 +1012,7 @@ dictionary MediaMetadataInit {
   DOMString artist = "";
   DOMString album = "";
   sequence&lt;MediaImage> artwork = [];
+  sequence&lt;ChapterInformationInit> chapterInfo = [];
 };
 </pre>
 
@@ -937,21 +1039,27 @@ dictionary MediaMetadataInit {
   but a list of type {{MediaImage}} internally.
 </p>
 
+<p>
+  A {{MediaMetadata}} has an associated list of <dfn for="MediaMetadata">
+  chapter information</dfn>.
+</p>
+
 <p>
   A {{MediaMetadata}} is said to be an <dfn>empty metadata</dfn> if it is equal
-  to <code>null</code> or all the following conditions are true:
+  to `null` or all the following conditions are true:
   <ul>
     <li>Its <a for=MediaMetadata>title</a> is the empty string.</li>
     <li>Its <a for=MediaMetadata>artist</a> is the empty string.</li>
     <li>Its <a for=MediaMetadata>album</a> is the empty string.</li>
     <li>Its <a for=MediaMetadata title='artwork image'>artwork images</a> length
     is <code>0</code>.</li>
+    <li>Its <a for=MediaMetadata>chapter information</a> length is
+    <code>0</code>.</li>
   </ul>
 </p>
 
 <p>
-  The <dfn constructor
-  for="MediaMetadata"><code>MediaMetadata(<var>init</var>)</code></dfn>
+  The <dfn constructor for="MediaMetadata">MediaMetadata(<var>init</var>)</dfn>
   constructor, when invoked, MUST run the following steps:
 
   <ol>
@@ -977,6 +1085,20 @@ dictionary MediaMetadataInit {
       and set <var>metadata</var>'s <a for="MediaMetadata">artwork images</a>
       as the result if it succeeded.
     </li>
+    <li>
+      Let <var>chapters</var> be an empty list of type {{ChapterInformation}}.
+    </li>
+    <li>
+      For each <var>entry</var> in <var>init</var>'s
+      {{MediaMetadataInit/chapterInfo}}, [=create a ChapterInformation=] from
+      <var>entry</var> and append it to
+      <var>chapters</var>.
+    </li>
+    <li>
+      Set <var>metadata</var>'s <a for="MediaMetadata">chapter information</a>
+      to the result of [=Create a frozen array|creating a frozen array=] from
+      <var>chapters</var>.
+    </li>
     <li>
       Return <var>metadata</var>.
     </li>
@@ -991,8 +1113,8 @@ the user agent MUST run the following steps:
     Let <var>output</var> be an empty list of type {{MediaImage}}.
   </li>
   <li>
-    For each <var>entry</var> in <var>input</var>'s
-    {{MediaMetadataInit/artwork}}, perform the following steps:
+    For each <var>entry</var> in <var>input</var> (which is a {{MediaImage}}
+    list), perform the following steps:
     <ol>
       <li>
         Let <var>image</var> be a new {{MediaImage}}.
@@ -1024,31 +1146,29 @@ the user agent MUST run the following steps:
 </ol>
 
 <p>
-  The <dfn attribute for="MediaMetadata"><code>title</code></dfn> attribute
-  reflects the {{MediaMetadata}}'s <a for=MediaMetadata>title</a>. On getting,
-  it MUST return the {{MediaMetadata}}'s <a for=MediaMetadata>title</a>. On
-  setting, it MUST set the {{MediaMetadata}}'s <a for=MediaMetadata>title</a> to
-  the given value.
+  The <dfn attribute for="MediaMetadata">title</dfn> attribute reflects the
+  {{MediaMetadata}}'s <a for=MediaMetadata>title</a>. On getting, it MUST return
+  the {{MediaMetadata}}'s <a for=MediaMetadata>title</a>. On setting, it MUST
+  set the {{MediaMetadata}}'s <a for=MediaMetadata>title</a> to the given value.
 </p>
 
 <p>
-  The <dfn attribute for="MediaMetadata"><code>artist</code></dfn> attribute
-  reflects the {{MediaMetadata}}'s <a for=MediaMetadata>artist</a>. On getting,
-  it MUST return the {{MediaMetadata}}'s <a for=MediaMetadata>artist</a>. On
-  setting, it MUST set the {{MediaMetadata}}'s <a for=MediaMetadata>artist</a>
+  The <dfn attribute for="MediaMetadata">artist</dfn> attribute reflects the
+  {{MediaMetadata}}'s <a for=MediaMetadata>artist</a>. On getting, it MUST
+  return the {{MediaMetadata}}'s <a for=MediaMetadata>artist</a>. On setting, it
+  MUST set the {{MediaMetadata}}'s <a for=MediaMetadata>artist</a>
   to the given value.
 </p>
 
 <p>
-  The <dfn attribute for="MediaMetadata"><code>album</code></dfn> attribute
-  reflects the {{MediaMetadata}}'s <a for=MediaMetadata>album</a>. On getting,
-  it MUST return the {{MediaMetadata}}'s <a for=MediaMetadata>album</a>. On
-  setting, it MUST set the {{MediaMetadata}}'s <a for=MediaMetadata>album</a> to
-  the given value.
+  The <dfn attribute for="MediaMetadata">album</dfn> attribute reflects the
+  {{MediaMetadata}}'s <a for=MediaMetadata>album</a>. On getting, it MUST return
+  the {{MediaMetadata}}'s <a for=MediaMetadata>album</a>. On setting, it MUST
+  set the {{MediaMetadata}}'s <a for=MediaMetadata>album</a> to the given value.
 </p>
 
 <p>
-  The <dfn attribute for="MediaMetadata"><code>artwork</code></dfn>
+  The <dfn attribute for="MediaMetadata">artwork</dfn>
   attribute reflects the {{MediaMetadata}}'s <a for="MediaMetadata">artwork
   images</a>. On getting, it MUST return the result of the following steps:
   <ol>
@@ -1084,8 +1204,8 @@ the user agent MUST run the following steps:
         better to do this with IDL primitives instead of JS - see
         https://www.w3.org/Bugs/Public/show_bug.cgi?id=29004 -->
         <li>
-          Call <a lt="freeze">Object.freeze</a> on the <var>object</var>,
-          to prevent accidental mutation by scripts.
+          Call {{Object/freeze(O)}} on <var>image</var>, to prevent accidental
+          mutation by scripts.
         </li>
         <li>
           Append the <var>object</var> to <var>frozenArtwork</var>.
@@ -1117,8 +1237,8 @@ the user agent MUST run the following steps:
   following steps:
   <ol>
     <li>
-      If the instance has no associated <a for=MediaMetadata>media session</a>,
-      abort these steps.
+      If the instance has no associated [=MediaMetadata/media session=], abort
+      these steps.
     </li>
     <li>
       Otherwise, <a>queue a task</a> to run the following substeps:
@@ -1136,6 +1256,108 @@ the user agent MUST run the following steps:
   </ol>
 </p>
 
+<h2 id="the-chapterinformation-interface">The {{ChapterInformation}}
+interface</h2>
+
+<pre class="idl">
+[Exposed=Window]
+interface ChapterInformation {
+  readonly attribute DOMString title;
+  readonly attribute double startTime;
+  [SameObject] readonly attribute FrozenArray&lt;MediaImage> artwork;
+};
+
+dictionary ChapterInformationInit {
+  DOMString title = "";
+  double startTime = 0;
+  sequence&lt;MediaImage> artwork = [];
+};
+
+</pre>
+
+<p>
+  A {{ChapterInformation}} object is a representation of metadata for an
+  individual chapter, such as the title of the section, its timestamp, and
+  screenshot image data of this section, that can be used by user agents to
+  provide a customized user interface.
+</p>
+
+<p>
+  A {{ChapterInformation}} can have an associated <dfn for="ChapterInformation">
+  media metadata</dfn>.
+</p>
+
+<p>
+  A {{ChapterInformation}} has an associated <dfn
+  for="ChapterInformation">title</dfn>
+  which is a {{DOMString}}.
+</p>
+
+<p>
+  A {{ChapterInformation}} has an associated <dfn for="ChapterInformation">
+  startTime</dfn> which is a {{double}}.
+</p>
+
+<p>
+  A {{ChapterInformation}} has an associated list of <dfn
+  for="ChapterInformation">
+  artwork images</dfn>.
+</p>
+
+<p>
+  To <dfn>create a {{ChapterInformation}}</dfn> with <var>init</var>, run the
+  following steps:
+
+  <ol>
+    <li>
+      Let <var>chapterInfo</var> be a new {{ChapterInformation}} object.
+    </li>
+    <li>
+      Set <var>chapterInfo</var>'s {{ChapterInformation/title}} to
+      <var>init</var>'s {{ChapterInformationInit/title}}.
+    </li>
+    <li>
+      Set <var>chapterInfo</var>'s {{ChapterInformation/startTime}} to
+      <var>init</var>'s {{ChapterInformationInit/startTime}}. If the <a
+      for=ChapterInformation>startTime</a> is negative or greater than
+      [=duration=], throw a <a exception>TypeError</a>.
+    </li>
+    <li>
+      Let <var>artwork</var> be the result of running the <a>convert artwork
+      algorithm</a> with <var>init</var>'s {{ChapterInformationInit/artwork}}.
+    </li>
+    <li>
+      Set <var>chapterInfo</var>'s <a for="ChapterInformation">artwork
+      images</a> to the result of [=Create a frozen array|creating a frozen
+      array=] from <var>artwork</var>.
+    </li>
+    <li>
+      Return <var>chapterInfo</var>.
+    </li>
+  </ol>
+</p>
+
+<p>
+  The <dfn attribute for="ChapterInformation">title</dfn> attribute reflects the
+  {{ChapterInformation}}'s <a for=ChapterInformation>title</a>. On getting, it
+  MUST return the {{ChapterInformation}}'s <a for=ChapterInformation>title</a>.
+</p>
+
+<p>
+  The <dfn attribute for="ChapterInformation">startTime</dfn> attribute reflects
+  the {{ChapterInformation}}'s <a for=ChapterInformation>startTime</a> in
+  seconds. On getting, it MUST return the {{ChapterInformation}}'s <a
+  for=ChapterInformation>startTime</a>.
+</p>
+
+<p>
+  The <dfn attribute for="ChapterInformation">artwork</dfn>
+  attribute reflects the {{ChapterInformation}}'s <a
+  for="ChapterInformation">artwork images</a>. On getting, it MUST return the
+  {{ChapterInformation}}'s <a for=ChapterInformation>
+  artwork images</a>.
+</p>
+
 <h2 id="the-mediaimage-dictionary">The {{MediaImage}} dictionary</h2>
 
 <pre class="idl">
@@ -1147,22 +1369,21 @@ dictionary MediaImage {
 };
 </pre>
 
-The {{MediaImage}} dictionary members are inspired by the <a lt="image
-object">image objects</a> in Web App Manifest.
+<p class="informative">The {{MediaImage}} dictionary members are inspired by
+{{ImageResource}} in [[IMAGE-RESOURCE]].</p>
 
 The <dfn dict-member for="MediaImage">src</dfn> <a>dictionary member</a> is used
-to specify the {{MediaImage}} object's <dfn for="MediaImage">source</dfn>. It is
-a URL from which the user agent can fetch the image's data.
+to specify the {{MediaImage}} object's <dfn attribute
+for="MediaImage">source</dfn>. It is a URL from which the user agent can fetch
+the image's data.
 
 The <dfn dict-member for="MediaImage">sizes</dfn> <a>dictionary member</a> is
 used to specify the {{MediaImage}} object's {{MediaImage/sizes}}. It follows the
-spec of <a attribute for="HTMLLinkElement"><code>sizes</code></a> attribute in
-the HTML
-<a for="HTMLLinkElement"><code>link</code></a> element, which is a string
-consisting of an <a>unordered set of unique space-separated tokens</a> which are
-<a>ASCII case-insensitive</a> that represents the dimensions of an image. Each
-keyword is either an <a>ASCII case-insensitive</a> match for the string "any",
-or a value that consists of two valid non-negative integers that do not have a
+spec of <{link/sizes}> attribute in the HTML <{link}> element, which is a string
+consisting of an [=unordered set of unique space-separated tokens=] which are
+[=ASCII case-insensitive=] that represents the dimensions of an image. Each
+keyword is either an [=ASCII case-insensitive=] match for the string "any", or a
+value that consists of two valid non-negative integers that do not have a
 leading U+0030 DIGIT ZERO (0) character and that are separated by a single
 U+0078 LATIN SMALL LETTER X or U+0058 LATIN CAPITAL LETTER X character. The
 keywords represent icon sizes in raw pixels (as opposed to CSS pixels). When
@@ -1183,7 +1404,7 @@ dictionary</h2>
 <pre class="idl">
 
 dictionary MediaPositionState {
-  double duration;
+  unrestricted double duration;
   double playbackRate;
   double position;
 };
@@ -1221,38 +1442,81 @@ dictionary MediaSessionActionDetails {
 };
 
 dictionary MediaSessionSeekActionDetails : MediaSessionActionDetails {
-  double? seekOffset;
+  double seekOffset;
 };
 
 dictionary MediaSessionSeekToActionDetails : MediaSessionActionDetails {
   required double seekTime;
-  boolean? fastSeek;
+  boolean fastSeek;
 };
+
+dictionary MediaSessionCaptureActionDetails : MediaSessionActionDetails {
+  boolean isActivating;
+};
+
 </pre>
 
 The {{MediaSessionActionHandler}} MUST be run with the <var>details</var>
-parameter which is represented by a dictionary inherited from
-{{MediaSessionActionDetails}}.
-
-The <dfn dict-member for="MediaSessionActionDetails">action</dfn> <a>dictionary
-member</a>
-is used to specify the <a>action</a> that the {{MediaSessionActionHandler}} is
-associated with.
+parameter whose dictionary type is:
+<ul>
+  <li>{{MediaSessionActionDetails}} for {{MediaSessionAction/play}}.</li>
+  <li>{{MediaSessionActionDetails}} for {{MediaSessionAction/pause}}.</li>
+  <li>{{MediaSessionSeekActionDetails}} for
+  {{MediaSessionAction/seekbackward}}.</li>
+  <li>{{MediaSessionSeekActionDetails}} for
+  {{MediaSessionAction/seekforward}}.</li>
+  <li>{{MediaSessionActionDetails}} for
+  {{MediaSessionAction/previoustrack}}.</li>
+  <li>{{MediaSessionActionDetails}} for {{MediaSessionAction/nexttrack}}.</li>
+  <li>{{MediaSessionActionDetails}} for {{MediaSessionAction/skipad}}.</li>
+  <li>{{MediaSessionActionDetails}} for {{MediaSessionAction/stop}}.</li>
+  <li>{{MediaSessionSeekToActionDetails}} for
+  {{MediaSessionAction/seekto}}.</li>
+  <li>{{MediaSessionCaptureActionDetails}} for
+  {{MediaSessionAction/togglemicrophone}}.</li>
+  <li>{{MediaSessionCaptureActionDetails}} for
+  {{MediaSessionAction/togglecamera}}.</li>
+  <li>{{MediaSessionActionDetails}} for {{MediaSessionAction/hangup}}.</li>
+  <li>{{MediaSessionActionDetails}} for
+  {{MediaSessionAction/previousslide}}.</li>
+  <li>{{MediaSessionActionDetails}} for {{MediaSessionAction/nextslide}}.</li>
+  <li>{{MediaSessionActionDetails}} for
+  {{MediaSessionAction/enterpictureinpicture}}.</li>
+</ul>
+
+The <dfn dict-member for="MediaSessionActionDetails">action</dfn>
+<a>dictionary member</a> is used to specify the <a>media session action</a>
+that the {{MediaSessionActionHandler}} is associated with.
 
 The <dfn dict-member for="MediaSessionSeekActionDetails">seekOffset</dfn>
-<a>dictionary member</a> MAY be provided and is the time in seconds to move the
-playback time by. If it is not provided then the site should choose a sensible
-time (e.g. a few seconds).
+<a>dictionary member</a> is the time in seconds to move the playback time by. If
+present, it should always be positive. If it is not provided then the site
+should choose a sensible time (e.g. a few seconds).
 
 The <dfn dict-member for="MediaSessionSeekToActionDetails">seekTime</dfn>
-<a>dictionary member</a> MUST be provided and is the time in seconds to move the
-playback time to.
+<a>dictionary member</a> is the time in seconds to move the playback time to.
+
+The <dfn dict-member for="MediaSessionSeekToActionDetails">fastSeek</dfn>
+<a>dictionary member</a> will be true if the seek [=media session
+action|action=] is being called multiple times as part of a sequence and this is
+not the last call in that sequence.
+
+The <dfn dict-member for="MediaSessionCaptureActionDetails">isActivating</dfn>
+<a>dictionary member</a> will be <code>false</code> if the user agent is about
+to [=pausing all input sources|pause all input sources=] related to the capture
+[=media session action|action=] and <code>true</code> otherwise. This
+<a>dictionary member</a> MUST be present if the user agent implements a policy
+of [=pausing all input sources=].
 
-The <dfn dict-member for="MediaSessionSeekToActionDetails">fastSeek</dfn>
-<a>dictionary member</a> MAY be provided and will be true if the
-<a enum-value for=MediaSessionAction>seekto</a> <a>action</a> is being called
-multiple times as part of a sequence and this is not the last call in that
-sequence.
+<h2 id="permissions-policy">Permissions Policy Integration</h2>
+
+This specification defines a [=policy-controlled feature=] identified by the
+string "mediasession". Its [=default allowlist=] is [=default allowlist/*=].
+
+A document's <a>permissions policy</a> determines whether any content in that
+document is allowed to use the MediaSession API. If disabled in the document,
+the user agent MUST NOT select the document's media session as the <a>active
+media session</a>.
 
 <h2 id="examples">Examples</h2>
 
@@ -1266,14 +1530,19 @@ sequence.
       title: "Episode Title",
       artist: "Podcast Host",
       album: "Podcast Title",
-      artwork: [{src: "podcast.jpg"}]
+      artwork: [{src: "podcast.jpg"}],
+      chapterInfo: [
+        {title: "Chapter 1", startTime: 0, artwork: [{src: "chapter1.jpg"}]},
+        {title: "Chapter 2", startTime: 120, artwork: [{src: "chapter2.jpg"}]}
+      ]
     });
   </pre>
 
   Alternatively, providing multiple <a for="MediaMetadata" title="artwork
   image">artwork images</a> in the metadata allows the user agent to
   select different artwork images for different display purposes and better fit
-  for different screens:
+  for different screens (the same applies to the artwork in
+  {{MediaMetadata/chapterInfo}}):
 
   <pre class="lang-javascript">
     navigator.mediaSession.metadata = new MediaMetadata({
@@ -1287,23 +1556,32 @@ sequence.
         {src: "podcast.png", sizes: "128x128", type: "image/png"},
         {src: "podcast_hd.png", sizes: "256x256", type: "image/png"},
         {src: "podcast.ico", sizes: "128x128 256x256", type: "image/x-icon"}
+      ],
+      chapterInfo: [
+        {title: "Chapter 1", startTime: 0, artwork: [
+           {src: "chapter1_a.jpg", sizes: "128x128", type: "image/jpeg"},
+           {src: "chapter1_b.png", sizes: "256x256", type: "image/png"}
+         ]},
+        {title: "Chapter 2", startTime: 120, artwork: [
+           {src: "chapter2_a.jpg", sizes: "128x128", type: "image/jpeg"},
+           {src: "chapter2_b.png", sizes: "256x256", type: "image/png"}
+         ]}
       ]
     });
   </pre>
 
   For example, if the user agent wants to use an image as icon, it may choose
-  <code>"podcast.jpg"</code> or <code>"podcast.png"</code> for a
-  low-pixel-density screen, and <code>"podcast_hd.jpg"</code>
-  or <code>"podcast_hd.png"</code> for a high-pixel-density screen. If the user
-  agent wants to use an image for lockscreen background,
-  <code>"podcast_xhd.jpg"</code> will be preferred.
+  `"podcast.jpg"` or `"podcast.png"` for a low-pixel-density screen, and
+  `"podcast_hd.jpg"` or `"podcast_hd.png"` for a high-pixel-density screen. If
+  the user agent wants to use an image for lockscreen background,
+  `"podcast_xhd.jpg"` will be preferred.
 
 </div>
 
 <div class="example" id="example-changing-metadata">
-  Changing <a for=MediaSession>metadata</a>:
+  Changing [=MediaSession/metadata=]:
 
-  For playlists or chapters of an audio book, multiple <a>media elements</a> can
+  For playlists or chapters of an audio book, multiple [=media elements=] can
   share a single <a>media session</a>.
 
   <pre class="lang-javascript">
@@ -1346,7 +1624,7 @@ sequence.
     var audio = document.createElement("audio");
     audio.src = tracks[trackId];
 
-    void updatePlayingMedia() {
+    function updatePlayingMedia() {
       audio.src = tracks[trackId];
       // Update metadata (omitted)
     }
@@ -1454,6 +1732,67 @@ sequence.
   </pre>
 </div>
 
+<div class="example" id="example-microphone-camera-hangup">
+  Using video conferencing actions:
+  <pre class="lang-javascript">
+    var isMicrophoneActive = false;
+    var isCameraActive = false;
+
+    navigator.mediaSession.setMicrophoneActive(isMicrophoneActive);
+    navigator.mediaSession.setCameraActive(isCameraActive);
+
+    navigator.mediaSession.setActionHandler("togglemicrophone", function() {
+      if (isMicrophoneActive) {
+        // Mute the microphone. Implementation omitted.
+      } else {
+        // Unmute the microphone. Implementation omitted.
+      }
+      isMicrophoneActive = !isMicrophoneActive;
+      navigator.mediaSession.setMicrophoneActive(isMicrophoneActive);
+    });
+
+    navigator.mediaSession.setActionHandler("togglecamera", function() {
+      if (isCameraActive) {
+        // Disable the camera. Implementation omitted.
+      } else {
+        // Enable the camera. Implementation omitted.
+      }
+      isCameraActive = !isCameraActive;
+      navigator.mediaSession.setCameraActive(isCameraActive);
+    });
+
+    navigator.mediaSession.setActionHandler("hangup", function() {
+      // End the call. Implementation omitted.
+    });
+  </pre>
+</div>
+
+<div class="example" id="example-presenting-slide-actions">
+  Handling presenting slide actions:
+  <pre class="lang-javascript">
+    var currentSlideIndex = 0;
+
+    navigator.mediaSession.setActionHandler("previousslide", function() {
+      currentSlideIndex--;
+      // Set current slide. Implementation omitted.
+    });
+
+    navigator.mediaSession.setActionHandler("nextslide", function() {
+      currentSlideIndex++;
+      // Set current slide. Implementation omitted.
+    });
+  </pre>
+</div>
+
+<div class="example" id="example-enterpictureinpicture">
+  Handling picture-in-picture:
+  <pre class="lang-javascript">
+    navigator.mediaSession.setActionHandler("enterpictureinpicture", function() {
+      remoteVideo.requestPictureInPicture();
+    });
+  </pre>
+</div>
+
 <h2 id="acknowledgments" class="no-num">Acknowledgments</h2>
 
 The editors would like to thank Paul Adenot, Jake Archibald, Tab Atkins,
@@ -1468,5 +1807,3 @@ patience in working through the initial design issues; Jer Noble for his help in
 building a model that also works well within the iOS audio focus model; and
 Mounir Lamouri and Anton Vayvod for their early involvement, feedback and
 support in making this specification happen.
-
-<script id=head src=https://resources.whatwg.org/dfn.js></script>