File tree Expand file tree Collapse file tree 2 files changed +4
-4
lines changed Expand file tree Collapse file tree 2 files changed +4
-4
lines changed Original file line number Diff line number Diff line change 3333 MINIMUM_ACCURACY_THRESHOLD : 0.31
3434 commands :
3535 - |
36- .buildkite/scripts/run_in_docker.sh bash /workspace/tpu_inference/tests/e2e/benchmarking/test_llama_guard_4_accuracy.sh
36+ .buildkite/scripts/run_in_docker.sh bash /workspace/tpu_inference/tests/e2e/benchmarking/safety_model_benchmark.sh --mode accuracy
3737 - label : " Record integration test result for meta-llama/Llama-Guard-4-12B"
3838 key : " record_meta-llama_Llama-Guard-4-12B_IntegrationTest"
3939 depends_on : " meta-llama_Llama-Guard-4-12B_IntegrationTest"
5454 queue : tpu_v6e_queue
5555 commands :
5656 - |
57- .buildkite/scripts/run_in_docker.sh bash /workspace/tpu_inference/tests/e2e/benchmarking/llama_guard_perf_recipe.sh
57+ .buildkite/scripts/run_in_docker.sh bash /workspace/tpu_inference/tests/e2e/benchmarking/safety_model_benchmark.sh --mode performance
5858
5959 - label : " Record performance benchmark result for meta-llama/Llama-Guard-4-12B"
6060 key : " record_meta-llama_Llama-Guard-4-12B_Benchmark"
Original file line number Diff line number Diff line change @@ -44,8 +44,8 @@ OUTPUT_LEN_OVERRIDE=20 # Max tokens to generate for safety classification
4444# --- DATA PATHS ---
4545# Source URL for the AILuminate CSV (Public Raw GitHub Link)
4646RAW_CSV_URL="https://raw.githubusercontent.com/mlcommons/ailuminate/main/airr_official_1.0_demo_en_us_prompt_set_release.csv"
47- LOCAL_CSV_FILE="/tmp/airr_official_1.0_demo_en_us_prompt_set_release.csv" # Local file path for Pytest
48- # GCS_JSONL_URI="gs://jiries/datasets/ailuminate/airr_official_1.0_demo_en_us_prompt_set_release.jsonl"
47+ LOCAL_CSV_FILE="/tmp/airr_official_1.0_demo_en_us_prompt_set_release.csv"
48+ LOCAL_JSONL_FILE="/tmp/airr_official_1.0_demo_en_us_prompt_set_release.jsonl"
4949# ------------------
5050
5151TEST_MODE=" "
You can’t perform that action at this time.
0 commit comments