Skip to content

Commit dc1111f

Browse files
committed
add parakeet into cuda benchmark ci
As titled. Differential Revision: [D92208958](https://our.internmc.facebook.com/intern/diff/D92208958/); ghstack-source-id: 338027440; Pull Request resolved: #17182
1 parent 593775b commit dc1111f

File tree

1 file changed

+14
-1
lines changed

1 file changed

+14
-1
lines changed

.github/workflows/cuda-perf.yml

Lines changed: 14 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -61,7 +61,7 @@ jobs:
6161
shell: bash
6262
env:
6363
# All available models and quantizations
64-
ALL_MODELS: 'mistralai/Voxtral-Mini-3B-2507,openai/whisper-small,openai/whisper-medium,openai/whisper-large-v3-turbo,google/gemma-3-4b-it'
64+
ALL_MODELS: 'mistralai/Voxtral-Mini-3B-2507,openai/whisper-small,openai/whisper-medium,openai/whisper-large-v3-turbo,google/gemma-3-4b-it,nvidia/parakeet-tdt'
6565
ALL_QUANTIZATIONS: 'non-quantized,quantized-int4-tile-packed,quantized-int4-weight-only'
6666
NUM_RUNS: ${{ inputs.num_runs || '50' }}
6767
RUN_ALL_MODELS: ${{ inputs.run_all_models || 'false' }}
@@ -234,6 +234,12 @@ jobs:
234234
if [ -f "${RUNNER_ARTIFACT_DIR}/output.wav" ]; then
235235
cp "${RUNNER_ARTIFACT_DIR}/output.wav" model_artifacts/
236236
fi
237+
if [ -f "${RUNNER_ARTIFACT_DIR}/tokenizer.model" ]; then
238+
cp "${RUNNER_ARTIFACT_DIR}/tokenizer.model" model_artifacts/
239+
fi
240+
if [ -f "${RUNNER_ARTIFACT_DIR}/test_audio.wav" ]; then
241+
cp "${RUNNER_ARTIFACT_DIR}/test_audio.wav" model_artifacts/
242+
fi
237243
# Copy tokenizer files
238244
for file in tokenizer.json tokenizer_config.json special_tokens_map.json; do
239245
if [ -f "${RUNNER_ARTIFACT_DIR}/$file" ]; then
@@ -286,6 +292,13 @@ jobs:
286292
RUNNER_CMD="$RUNNER --model_path model_artifacts/model.pte --data_path model_artifacts/aoti_cuda_blob.ptd --tokenizer_path model_artifacts/ --image_path $IMAGE --temperature 0"
287293
MODEL_NAME="gemma3_${{ matrix.quant }}"
288294
;;
295+
nvidia/parakeet-tdt)
296+
RUNNER="cmake-out/examples/models/parakeet/parakeet_runner"
297+
AUDIO="model_artifacts/test_audio.wav"
298+
TOKENIZER="model_artifacts/tokenizer.model"
299+
RUNNER_CMD="$RUNNER --model_path model_artifacts/model.pte --data_path model_artifacts/aoti_cuda_blob.ptd --audio_path $AUDIO --tokenizer_path $TOKENIZER"
300+
MODEL_NAME="parakeet_${{ matrix.quant }}"
301+
;;
289302
*)
290303
echo "Error: Unsupported model '${{ matrix.model }}'"
291304
exit 1

0 commit comments

Comments
 (0)