Add automatic retry for 429/503 with exponential backoff

This commit is contained in:
Franz Kafka 2026-04-16 19:00:37 +00:00
parent 29292addac
commit 78b3239bbd
3 changed files with 89 additions and 7 deletions

View file

@ -6,6 +6,10 @@ upstream_url: "https://api.z.ai/api/anthropic"
# Remove this line or set to null to use client-specified temperatures
# temperature: 0.7
# Retry configuration for transient errors (HTTP 429, 503).
# Requests failing with these statuses are retried automatically with
# exponential backoff.
#
# Retry limit for a single request.
# NOTE(review): confirm whether this counts retries only or includes the
# initial attempt.
max_retries: 3
# Base delay for the backoff, in milliseconds.
# NOTE(review): presumably the wait grows from this value on each successive
# retry; confirm the growth factor and any cap/jitter in the retry code.
retry_base_delay_ms: 1000
models:
- id: "glm-4.7"
owned_by: "zhipu"