From 358cd7225a1e42d30c11301ad8d27a1ebec4f1b4 Mon Sep 17 00:00:00 2001
From: Justin Uberti
Date: Mon, 29 Jul 2024 14:32:24 -0700
Subject: [PATCH] Use 50 max tokens for function calls (#32)

---
Review notes (this section is not part of the commit message):
- The per-mode override table is named max_tokens_by_mode so that the loop's
  scalar max_tokens no longer assigns to the associative array itself. In
  bash, a plain assignment to an array name writes element "0" and a plain
  expansion reads element "0", so the earlier form only produced the right
  value by accident (ShellCheck SC2178 / SC2128).
- Modes without an entry in max_tokens_by_mode fall back to
  default_max_tokens via the ${...:-...} expansion.
- Line breaks and indentation of this patch were reconstructed; confirm the
  context whitespace against bench.yml, or apply with --ignore-whitespace.
  The post-image blob id on the index line predates the rename.

 .github/workflows/bench.yml | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/.github/workflows/bench.yml b/.github/workflows/bench.yml
index 802591d..6be84cf 100644
--- a/.github/workflows/bench.yml
+++ b/.github/workflows/bench.yml
@@ -16,10 +16,15 @@ jobs:
           # Pre-warm any spun-down instances (only audio right now)
           curl -f -X POST "https://ai-benchmarks.fly.dev/bench?mode=audio&max_tokens=20&num_requests=1"
           # Run the benchmarks
+          declare -A max_tokens_by_mode=(
+            ["tools"]=50
+          )
+          default_max_tokens=20
           regions=("sea" "iad" "cdg")
           media=("text" "tools" "image" "audio")
           for region in "${regions[@]}"; do
             for medium in "${media[@]}"; do
-              curl -f -X POST "https://ai-benchmarks.fly.dev/bench?mode=$medium&max_tokens=20&spread=30&store" -H "fly-prefer-region: $region"
+              max_tokens=${max_tokens_by_mode[$medium]:-$default_max_tokens}
+              curl -f -X POST "https://ai-benchmarks.fly.dev/bench?mode=$medium&max_tokens=$max_tokens&spread=30&store" -H "fly-prefer-region: $region"
             done
           done