Choosing input/total tokens automatically based on available VRAM? #211

	# Workflow that builds a documentation preview for a pull request by
	# delegating to a reusable workflow hosted in huggingface/doc-builder.
	name: Build PR Documentation

	# Run only for pull requests that touch files under docs/source/.
	on:
	  pull_request:
	    paths:
	      - "docs/source/**"

	# One concurrency group per workflow + PR head ref; when head_ref is empty
	# the expression falls back to run_id. A newer run in the same group
	# cancels the one still in progress.
	concurrency:
	  group: ${{ github.workflow }}-${{ github.head_ref || github.run_id }}
	  cancel-in-progress: true

	jobs:
	  build:
	    # Reusable workflow call, tracked at the `main` branch.
	    # NOTE(review): `@main` is a moving ref; confirm whether it should be
	    # pinned to a tag or commit SHA.
	    uses: huggingface/doc-builder/.github/workflows/build_pr_documentation.yml@main
	    with:
	      # Head commit of the pull request and the pull request number.
	      commit_sha: ${{ github.event.pull_request.head.sha }}
	      pr_number: ${{ github.event.number }}
	      package: text-generation-inference
	      # Passed through verbatim to the called workflow; presumably tells
	      # doc-builder the package is not an importable Python module
	      # (confirm against doc-builder).
	      additional_args: --not_python_module

Provide feedback