From 9b94e99e4d79fba5c306927f69333e49b1243eb3 Mon Sep 17 00:00:00 2001 From: Shaun Arman Date: Sat, 20 Jun 2026 19:49:42 -0500 Subject: [PATCH] ci(pr-review): increase LLM timeout to 600s, retry-max-time to 1200s qwen3.5-122b-think on a 253KB prompt was consistently hitting the 300s --max-time wall. --retry-max-time also equalled --max-time, so retries never fired. Now: 10 min per attempt, up to 2 retries (down from 3) spaced 15s apart (up from 10s), and no new retry is started once 20 min have elapsed since the first attempt began. Note that two consecutive full 600s timeouts plus the 15s delay already pass the 1200s mark, so the second retry only fires when an earlier attempt fails quickly (e.g. connection refused or a transient 5xx). --- .gitea/workflows/pr-review.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.gitea/workflows/pr-review.yml b/.gitea/workflows/pr-review.yml index 7cc76c5a..69343692 100644 --- a/.gitea/workflows/pr-review.yml +++ b/.gitea/workflows/pr-review.yml @@ -290,8 +290,8 @@ jobs: '{model: $model, messages: [{role: "user", content: $content}], stream: false}' \ > /tmp/body.json echo "[$(date -u +%Y-%m-%dT%H:%M:%SZ)] PR #${PR_NUMBER} - Calling liteLLM API ($(wc -c < /tmp/body.json) bytes)..." - HTTP_CODE=$(curl -s --max-time 300 --connect-timeout 30 \ - --retry 3 --retry-delay 10 --retry-connrefused --retry-max-time 300 \ + HTTP_CODE=$(curl -s --max-time 600 --connect-timeout 30 \ + --retry 2 --retry-delay 15 --retry-connrefused --retry-max-time 1200 \ -o /tmp/llm_response.json -w "%{http_code}" \ -X POST "$LITELLM_URL/chat/completions" \ -H "Authorization: Bearer $LITELLM_API_KEY" \