elastic
diff --git a/‎output/openapi/elasticsearch-openapi.json
Lines changed: 1 addition & 1 deletion b/‎output/openapi/elasticsearch-openapi.json
Lines changed: 1 addition & 1 deletion
diff --git a/‎output/openapi/elasticsearch-serverless-openapi.json
Lines changed: 1 addition & 1 deletion b/‎output/openapi/elasticsearch-serverless-openapi.json
Lines changed: 1 addition & 1 deletion
diff --git a/‎output/schema/schema.json
Lines changed: 3 additions & 2 deletions b/‎output/schema/schema.json
Lines changed: 3 additions & 2 deletions
diff --git a/‎specification/inference/_types/Services.ts
Lines changed: 21 additions & 0 deletions b/‎specification/inference/_types/Services.ts
Lines changed: 21 additions & 0 deletions
@@ -286,9 +286,30 @@ export type ServiceSettings = UserDefinedValue
 
 export type TaskSettings = UserDefinedValue
 
+/**
+ * This setting helps to minimize the number of rate limit errors returned from the service.
+ */
 export class RateLimitSetting {
   /**
    * The number of requests allowed per minute.
+   * By default, the number of requests allowed per minute is set by each service as follows:
+   *
+   * * `alibabacloud-ai-search` service: `1000`
+   * * `anthropic` service: `50`
+   * * `azureaistudio` service: `240`
+   * * `azureopenai` service and task type `text_embedding`: `1440`
+   * * `azureopenai` service and task type `completion`: `120`
+   * * `cohere` service: `10000`
+   * * `elastic` service and task type `chat_completion`: `240`
+   * * `googleaistudio` service: `360`
+   * * `googlevertexai` service: `30000`
+   * * `hugging_face` service: `3000`
+   * * `jinaai` service: `2000`
+   * * `mistral` service: `240`
+   * * `openai` service and task type `text_embedding`: `3000`
+   * * `openai` service and task type `completion`: `500`
+   * * `voyageai` service: `2000`
+   * * `watsonxai` service: `120`
    */
   requests_per_minute?: integer
 }