File tree Expand file tree Collapse file tree 2 files changed +11
-6
lines changed Expand file tree Collapse file tree 2 files changed +11
-6
lines changed Original file line number Diff line number Diff line change @@ -3,6 +3,14 @@ name: Benchmark v2 Framework
33on :
44 workflow_call :
55 inputs :
6+ runner_group :
7+ description : ' GH Actions runner group to use'
8+ required : false
9+ type : string
10+ runner_label :
11+ description : ' GH Actions runner label to use'
12+ required : false
13+ type : string
614 model_id :
715 description : ' Model ID to benchmark (e.g., meta-llama/Llama-2-7b-hf)'
816 required : false
5462jobs :
5563 benchmark-v2 :
5664 name : Benchmark v2
57- strategy :
58- matrix :
59- # Use GPU-enabled runners for accurate benchmarking
60- group : [aws-g5-4xlarge-cache]
6165 runs-on :
62- group : ${{ matrix.group }}
66+ group : ${{ inputs.runner_group }}
67+ label : ${{ inputs.runner_label }}
6368 container :
6469 image : huggingface/transformers-pytorch-gpu
6570 options : --gpus all --privileged --ipc host --shm-size "16gb"
Original file line number Diff line number Diff line change 1212 model_id :
1313 description : ' Model ID to benchmark (leave empty for default models)'
1414 required : false
15- type : string
1615 default : ' '
1716 warmup_iterations :
1817 description : ' Number of warmup iterations'
4746 name : Benchmark v2 - Default Models
4847 uses : ./.github/workflows/benchmark_v2.yml
4948 with :
49+ runner_group : " aws-g5-4xlarge-cache"
5050 model_id : ${{ inputs.model_id || '' }}
5151 warmup_iterations : ${{ inputs.warmup_iterations || 3 }}
5252 measurement_iterations : ${{ inputs.measurement_iterations || 5 }}
You can’t perform that action at this time.
0 commit comments