aboutsummaryrefslogtreecommitdiffstats
path: root/pkg/aflow/llm_agent.go
diff options
context:
space:
mode:
authorDmitry Vyukov <dvyukov@google.com>2026-01-16 09:33:14 +0100
committerDmitry Vyukov <dvyukov@google.com>2026-01-20 21:12:57 +0000
commit91e26ec437abcd42a8255aa88e31b45da059529e (patch)
treec9e6e26949375e3ae053f1fc84fe749e69d5cabc /pkg/aflow/llm_agent.go
parent7f5908e77ae0e7fef4b7901341b8c2c4bbb74b28 (diff)
pkg/aflow: handle model quota errors
Detect model quota violations (assumed to be RPD). Make syz-agent not request jobs that use the model until the next quota reset time. Fixes #6573
Diffstat (limited to 'pkg/aflow/llm_agent.go')
-rw-r--r--pkg/aflow/llm_agent.go9
1 files changed, 8 insertions, 1 deletions
diff --git a/pkg/aflow/llm_agent.go b/pkg/aflow/llm_agent.go
index 3c416b37c..d5e4d6d4d 100644
--- a/pkg/aflow/llm_agent.go
+++ b/pkg/aflow/llm_agent.go
@@ -9,6 +9,7 @@ import (
"maps"
"net/http"
"reflect"
+ "strings"
"time"
"github.com/google/syzkaller/pkg/aflow/trajectory"
@@ -289,8 +290,9 @@ func (a *LLMAgent) parseResponse(resp *genai.GenerateContentResponse) (
func (a *LLMAgent) generateContent(ctx *Context, cfg *genai.GenerateContentConfig,
req []*genai.Content) (*genai.GenerateContentResponse, error) {
backoff := time.Second
+ model := ctx.modelName(a.Model)
for try := 0; ; try++ {
- resp, err := ctx.generateContent(ctx.modelName(a.Model), cfg, req)
+ resp, err := ctx.generateContent(model, cfg, req)
var apiErr genai.APIError
if err != nil && try < 100 && errors.As(err, &apiErr) &&
apiErr.Code == http.StatusServiceUnavailable {
@@ -298,6 +300,11 @@ func (a *LLMAgent) generateContent(ctx *Context, cfg *genai.GenerateContentConfi
backoff = min(backoff+time.Second, 10*time.Second)
continue
}
+ if err != nil && errors.As(err, &apiErr) && apiErr.Code == http.StatusTooManyRequests &&
+ strings.Contains(apiErr.Message, "Quota exceeded for metric") &&
+ strings.Contains(apiErr.Message, "generate_requests_per_model_per_day") {
+ return resp, &modelQuotaError{model}
+ }
return resp, err
}
}