elastic · lcawl · Jun 5, 2025
diff --git a/output/openapi/elasticsearch-openapi.json b/output/openapi/elasticsearch-openapi.json
diff --git a/output/openapi/elasticsearch-serverless-openapi.json b/output/openapi/elasticsearch-serverless-openapi.json
diff --git a/output/schema/schema.json b/output/schema/schema.json
diff --git a/specification/inference/_types/Services.ts b/specification/inference/_types/Services.ts
@@ -286,9 +286,30 @@ export type ServiceSettings = UserDefinedValue
 
 export type TaskSettings = UserDefinedValue
 
+/**
+ * This setting helps to minimize the number of rate limit errors returned from the service.
+ */
 export class RateLimitSetting {
   /**
    * The number of requests allowed per minute.
+   * By default, the number of requests allowed per minute is set by each service as follows:
+   *
+   * * `alibabacloud-ai-search` service: `1000`
+   * * `anthropic` service: `50`
+   * * `azureaistudio` service: `240`
+   * * `azureopenai` service and task type `text_embedding`: `1440`
+   * * `azureopenai` service and task type `completion`: `120`
+   * * `cohere` service: `10000`
+   * * `elastic` service and task type `chat_completion`: `240`
+   * * `googleaistudio` service: `360`
+   * * `googlevertexai` service: `30000`
+   * * `hugging_face` service: `3000`
+   * * `jinaai` service: `2000`
+   * * `mistral` service: `240`
+   * * `openai` service and task type `text_embedding`: `3000`
+   * * `openai` service and task type `completion`: `500`
+   * * `voyageai` service: `2000`
+   * * `watsonxai` service: `120`
    */
   requests_per_minute?: integer
 }