From 78ab10ae8c4ef68818b37e929aca6cc6628c6d2d Mon Sep 17 00:00:00 2001
From: Brendan Jugan
Date: Mon, 28 Apr 2025 19:16:55 -0400
Subject: [PATCH] handle rate limiting retries for Elastic Inference Service

---
 .../elastic/ElasticInferenceServiceResponseHandler.java | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elastic/ElasticInferenceServiceResponseHandler.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elastic/ElasticInferenceServiceResponseHandler.java
index 61b4708b4d7cb..fcc80e686564a 100644
--- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elastic/ElasticInferenceServiceResponseHandler.java
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elastic/ElasticInferenceServiceResponseHandler.java
@@ -40,6 +40,8 @@ protected void checkForFailureStatusCode(Request request, HttpResult result) thr
             throw new RetryException(false, buildError(METHOD_NOT_ALLOWED, request, result));
         } else if (statusCode == 413) {
             throw new ContentTooLargeException(buildError(CONTENT_TOO_LARGE, request, result));
+        } else if (statusCode == 429) {
+            throw new RetryException(true, buildError(RATE_LIMIT, request, result));
         }
 
         throw new RetryException(false, buildError(UNSUCCESSFUL, request, result));