Create an inference endpoint to perform an inference task with the jinaai service.
To review the available rerank models, refer to https://jina.ai/reranker.
To review the available embedding and text_embedding models, refer to https://jina.ai/embeddings/.
Required authorization
- Cluster privileges: `manage_inference`
Path parameters
-
The type of the inference task that the model will perform.
Values are `embedding`, `rerank`, or `text_embedding`.
-
The unique identifier of the inference endpoint.
Query parameters
-
Specifies the amount of time to wait for the inference endpoint to be created.
External documentation
Body
Required
-
The chunking configuration object. Applies only to the
`embedding` and `text_embedding` task types. Not applicable to the `rerank` task type. External documentation
-
The type of service supported for the specified task type. In this case, `jinaai`.
Value is `jinaai`.
-
Settings used to install the inference model. These settings are specific to the
`jinaai` service.
-
Settings to configure the inference task. These settings are specific to the task type you specified.
PUT _inference/text_embedding/jinaai-embeddings
{
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"api_key": "JinaAi-Api-key"
}
}
resp = client.inference.put(
task_type="text_embedding",
inference_id="jinaai-embeddings",
inference_config={
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"api_key": "JinaAi-Api-key"
}
},
)
const response = await client.inference.put({
task_type: "text_embedding",
inference_id: "jinaai-embeddings",
inference_config: {
service: "jinaai",
service_settings: {
model_id: "jina-embeddings-v3",
api_key: "JinaAi-Api-key",
},
},
});
response = client.inference.put(
task_type: "text_embedding",
inference_id: "jinaai-embeddings",
body: {
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"api_key": "JinaAi-Api-key"
}
}
)
$resp = $client->inference()->put([
"task_type" => "text_embedding",
"inference_id" => "jinaai-embeddings",
"body" => [
"service" => "jinaai",
"service_settings" => [
"model_id" => "jina-embeddings-v3",
"api_key" => "JinaAi-Api-key",
],
],
]);
curl -X PUT -H "Authorization: ApiKey $ELASTIC_API_KEY" -H "Content-Type: application/json" -d '{"service":"jinaai","service_settings":{"model_id":"jina-embeddings-v3","api_key":"JinaAi-Api-key"}}' "$ELASTICSEARCH_URL/_inference/text_embedding/jinaai-embeddings"
client.inference().put(p -> p
.inferenceId("jinaai-embeddings")
.taskType(TaskType.TextEmbedding)
.inferenceConfig(i -> i
.service("jinaai")
.serviceSettings(JsonData.fromJson("{\"model_id\":\"jina-embeddings-v3\",\"api_key\":\"JinaAi-Api-key\"}"))
)
);
{
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"api_key": "JinaAi-Api-key"
}
}
{
"service": "jinaai",
"service_settings": {
"api_key": "JinaAI-Api-key",
"model_id": "jina-reranker-v2-base-multilingual"
},
"task_settings": {
"top_n": 10,
"return_documents": true
}
}
{
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v4",
"api_key": "JinaAi-Api-key"
}
}
{
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"api_key": "JinaAi-Api-key",
"multimodal_model": false
}
}
{
"inference_id": "jinaai-embeddings",
"task_type": "text_embedding",
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"rate_limit": {
"requests_per_minute": 2000
},
"dimensions": 1024,
"embedding_type": "float",
"similarity": "dot_product"
},
"chunking_settings": {
"strategy": "sentence",
"max_chunk_size": 250,
"sentence_overlap": 1
}
}
{
"inference_id": "jinaai-rerank",
"task_type": "rerank",
"service": "jinaai",
"service_settings": {
"model_id": "jina-reranker-v2-base-multilingual",
"rate_limit": {
"requests_per_minute": 2000
}
},
"task_settings": {
"top_n": 10,
"return_documents": true
}
}
{
"inference_id": "jinaai-embeddings-multimodal",
"task_type": "embedding",
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v4",
"rate_limit": {
"requests_per_minute": 2000
},
"dimensions": 2048,
"embedding_type": "float",
"similarity": "dot_product",
"multimodal_model": true
},
"chunking_settings": {
"strategy": "sentence",
"max_chunk_size": 250,
"sentence_overlap": 1
}
}
{
"inference_id": "jinaai-embeddings-text-only",
"task_type": "embedding",
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"rate_limit": {
"requests_per_minute": 2000
},
"dimensions": 1024,
"embedding_type": "float",
"similarity": "dot_product",
"multimodal_model": false
},
"chunking_settings": {
"strategy": "sentence",
"max_chunk_size": 250,
"sentence_overlap": 1
}
}