# GH Task Runner (Large Suite) #7
# Viewer notice: this file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
# Learn more about bidirectional Unicode characters
# Manually dispatched workflow: runs one model against a large matrix of
# evaluation tasks (one job per task, see `jobs` below in this file).
name: GH Task Runner (Large Suite)

# NOTE: generic YAML 1.1 parsers read the bare key `on` as a boolean;
# GitHub's workflow loader treats it as the trigger key.
on:
  workflow_dispatch:
    inputs:
      # Safety gate: the job's `if:` only runs when this equals APPROVED,
      # so the default leaves the run as a no-op.
      approval_notice:
        description: 'WARNING: This will spin up a large number of tasks - get approval from admin before running'
        required: false
        default: 'NOT_APPROVED'
        type: choice
        options:
          - NOT_APPROVED
          - APPROVED

      # Hugging Face repository of the model under evaluation.
      model_hf_repo:
        description: 'Model Hugging Face Repository'
        required: true
        default: 'RWKV/rwkv-5-world-1b5'

      # Extra model arguments, forwarded verbatim to the composite action.
      model_args:
        description: 'Model Arguments (ie: dtype="fp16")'
        required: false
        default: 'trust_remote_code=True'

      # Batch size, forwarded verbatim to the composite action.
      batch_size:
        description: 'Batch Size'
        required: true
        default: 'auto'

      # Used verbatim as the first `runs-on` runner label.
      backend:
        description: 'Backend to use'
        required: true
        default: 'nvidia-gpu'
        type: choice
        options:
          - nvidia-gpu
          - intel-gpu
          - amd-gpu
          - any-gpu

      # Interpolated into the `gpu-vram-<value>` runner label.
      # Options are quoted so they stay strings, matching the string default.
      gpu_vram:
        description: 'Minimum GPU VRAM (ignored for MPS)'
        required: true
        default: '24'
        type: choice
        options:
          - '16'
          - '24'
          - '40'
          - '48'
          - '80'

      # Quoted so the default is an explicit string rather than a YAML int.
      num_fewshot:
        description: 'num_fewshot setting (ignored if < 0)'
        required: true
        default: '-1'
# Workflow-level environment, visible to every job and step.
env:
  # Get the final task
  # NOTE(review): neither `custom_task` nor `run_task` is declared under
  # `workflow_dispatch.inputs` in this file, so this presumably evaluates to
  # an empty string here; the per-job task is passed to the composite action
  # through `with.run_task` instead. Confirm before relying on RUN_TASK.
  RUN_TASK: ${{ github.event.inputs.custom_task || github.event.inputs.run_task }}

  # HF repo to sync to
  HF_REPO_SYNC: rwkv-x-dev/lm-eval-output

  # Model HF repo
  MODEL_HF_REPO: ${{ github.event.inputs.model_hf_repo }}

  # Secrets
  HUGGING_FACE_HUB_TOKEN: ${{ secrets.HUGGING_FACE_HUB_TOKEN }}
jobs:
  # One matrix job per evaluation task; each job checks out the repository
  # and delegates to the local composite action.
  gh-task-runner-large-suite-1:
    # Check for approval notice: skip the job unless explicitly APPROVED.
    if: ${{ github.event.inputs.approval_notice == 'APPROVED' }}

    # Strategy Matrix
    strategy:
      # Disable fail-fast behavior so one failing task does not cancel the rest.
      fail-fast: false
      matrix:
        # NOTE: There is a matrix limit of 256 on github
        run_task:
          ### Medium Slow tasks (>=15 mins on 4x3090)
          ### ----------------------------------------------------------------------------
          - triviaqa
          - record
          - glue
          - gsm8k
          - kmmlu
          - nq_open
          - qqp
          - pythia
          # - kmmlu_*

          ### Faster tasks (<= 15 mins on 4x3090)
          ### ----------------------------------------------------------------------------
          - anli
          # - anli_*
          - ai2_arc
          # - arc_easy
          # - arc_challenge
          - arithmetic
          - blimp
          # - blimp_*
          - boolq
          - cb
          - ceval-valid
          # - ceval-valid_*
          - cmmlu
          # - cmmlu_*
          - cola
          - copa
          - crows_pairs
          # - crows_pairs_*
          - freebase
          - hellaswag
          - kobest
          # - kobest_*
          - lambada
          - lambada_cloze
          # - lambada_*
          - logieval
          - logiqa
          - logiqa2
          - loglikelihood
          - mathqa
          - mc_taco
          - medmcqa
          - medqa_4options
          # Quoted: the only active glob-style entry; keeps `*` a literal.
          - 'mgsm_*'
          - mmlu
          # - mmlu_*
          - mnli
          - mnli_mismatch
          - mrpc
          - multimedqa
          - multiple_choice
          - multirc
          - mutual
          - mutual_plus
          - openbookqa
          - piqa
          - prost
          - pubmedqa
          - qa4mre
          # - qa4mre_*
          - qnli
          - race
          - rte
          - sciq
          - sglue_rte
          - sst2
          - swag
          - sycophancy
          # - sycophancy_on_*
          - truthfulqa
          # - truthfulqa_*
          - webqs
          - wic
          - wikitext
          - winogrande
          - wnli
          - wsc
          - wsc273

    # Name of the job
    name: "[${{ matrix.run_task }}] ${{ github.event.inputs.model_hf_repo }} - ${{ github.event.inputs.model_args }}"

    # Due to the GitHub worker hard limit of 24 hours,
    # we apply a timeout of 23 hours (1380 minutes) instead.
    timeout-minutes: 1380

    # Select the type of runner that the job will run on:
    # a runner must carry both the backend label and the VRAM label.
    runs-on:
      - ${{ github.event.inputs.backend }}
      - gpu-vram-${{ github.event.inputs.gpu_vram }}
      # - gpu-count-any

    # Actual task setup, and run steps
    steps:
      # The checkout is required because the next step uses a composite
      # action referenced by a path inside this repository.
      # NOTE(review): actions/checkout@v3 is an older major version; consider
      # upgrading once the runners are confirmed compatible.
      - name: Checkout repository
        uses: actions/checkout@v3

      - name: Run the task
        uses: ./.github/actions/gh-task-runner-composite
        with:
          run_task: ${{ matrix.run_task }}
          num_fewshot: ${{ github.event.inputs.num_fewshot }}
          model_hf_repo: ${{ github.event.inputs.model_hf_repo }}
          model_args: ${{ github.event.inputs.model_args }}
          batch_size: ${{ github.event.inputs.batch_size }}
          # upload_to_hf: False