Skip to content

Commit 8d4c35a

Browse files
committed
Fixed dataset download issue and modified Buildkite CI YAML to reflect new perf and accuracy script changes
1 parent 9db0de2 commit 8d4c35a

File tree

2 files changed

+4
-4
lines changed

2 files changed

+4
-4
lines changed

.buildkite/models/meta-llama_Llama-Guard-4-12B.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -33,7 +33,7 @@ steps:
3333
MINIMUM_ACCURACY_THRESHOLD: 0.31
3434
commands:
3535
- |
36-
.buildkite/scripts/run_in_docker.sh bash /workspace/tpu_inference/tests/e2e/benchmarking/test_llama_guard_4_accuracy.sh
36+
.buildkite/scripts/run_in_docker.sh bash /workspace/tpu_inference/tests/e2e/benchmarking/safety_model_benchmark.sh --mode accuracy
3737
- label: "Record integration test result for meta-llama/Llama-Guard-4-12B"
3838
key: "record_meta-llama_Llama-Guard-4-12B_IntegrationTest"
3939
depends_on: "meta-llama_Llama-Guard-4-12B_IntegrationTest"
@@ -54,7 +54,7 @@ steps:
5454
queue: tpu_v6e_queue
5555
commands:
5656
- |
57-
.buildkite/scripts/run_in_docker.sh bash /workspace/tpu_inference/tests/e2e/benchmarking/llama_guard_perf_recipe.sh
57+
.buildkite/scripts/run_in_docker.sh bash /workspace/tpu_inference/tests/e2e/benchmarking/safety_model_benchmark.sh --mode performance
5858
5959
- label: "Record performance benchmark result for meta-llama/Llama-Guard-4-12B"
6060
key: "record_meta-llama_Llama-Guard-4-12B_Benchmark"

tests/e2e/benchmarking/safety_model_benchmark.sh

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -44,8 +44,8 @@ OUTPUT_LEN_OVERRIDE=20 # Max tokens to generate for safety classification
4444
# --- DATA PATHS ---
4545
# Source URL for the AILuminate CSV (Public Raw GitHub Link)
4646
RAW_CSV_URL="https://raw.githubusercontent.com/mlcommons/ailuminate/main/airr_official_1.0_demo_en_us_prompt_set_release.csv"
47-
LOCAL_CSV_FILE="/tmp/airr_official_1.0_demo_en_us_prompt_set_release.csv" # Local file path for Pytest
48-
#GCS_JSONL_URI="gs://jiries/datasets/ailuminate/airr_official_1.0_demo_en_us_prompt_set_release.jsonl"
47+
LOCAL_CSV_FILE="/tmp/airr_official_1.0_demo_en_us_prompt_set_release.csv"
48+
LOCAL_JSONL_FILE="/tmp/airr_official_1.0_demo_en_us_prompt_set_release.jsonl"
4949
# ------------------
5050

5151
TEST_MODE=""

0 commit comments

Comments
 (0)