Create an inference endpoint to perform an inference task with the jinaai service.
To review the available rerank models, refer to https://jina.ai/reranker.
To review the available embedding and text_embedding models, refer to https://jina.ai/embeddings/.
Required cluster privilege: manage_inference.
The type of the inference task that the model will perform.
Values are embedding, rerank, or text_embedding.
The unique identifier of the inference endpoint.
Specifies the amount of time to wait for the inference endpoint to be created.
The chunking configuration object.
Applies only to the embedding and text_embedding task types.
Not applicable to the rerank task type.
The type of service supported for the specified task type. In this case, jinaai.
Value is jinaai.
Settings used to install the inference model. These settings are specific to the jinaai service.
Settings to configure the inference task. These settings are specific to the task type you specified.
PUT _inference/text_embedding/jinaai-embeddings
{
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"api_key": "JinaAi-Api-key"
}
}
resp = client.inference.put(
task_type="text_embedding",
inference_id="jinaai-embeddings",
inference_config={
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"api_key": "JinaAi-Api-key"
}
},
)
const response = await client.inference.put({
task_type: "text_embedding",
inference_id: "jinaai-embeddings",
inference_config: {
service: "jinaai",
service_settings: {
model_id: "jina-embeddings-v3",
api_key: "JinaAi-Api-key",
},
},
});
response = client.inference.put(
task_type: "text_embedding",
inference_id: "jinaai-embeddings",
body: {
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"api_key": "JinaAi-Api-key"
}
}
)
$resp = $client->inference()->put([
"task_type" => "text_embedding",
"inference_id" => "jinaai-embeddings",
"body" => [
"service" => "jinaai",
"service_settings" => [
"model_id" => "jina-embeddings-v3",
"api_key" => "JinaAi-Api-key",
],
],
]);
curl -X PUT -H "Authorization: ApiKey $ELASTIC_API_KEY" -H "Content-Type: application/json" -d '{"service":"jinaai","service_settings":{"model_id":"jina-embeddings-v3","api_key":"JinaAi-Api-key"}}' "$ELASTICSEARCH_URL/_inference/text_embedding/jinaai-embeddings"
client.inference().put(p -> p
.inferenceId("jinaai-embeddings")
.taskType(TaskType.TextEmbedding)
.inferenceConfig(i -> i
.service("jinaai")
.serviceSettings(JsonData.fromJson("{\"model_id\":\"jina-embeddings-v3\",\"api_key\":\"JinaAi-Api-key\"}"))
)
);
{
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"api_key": "JinaAi-Api-key"
}
}
{
"service": "jinaai",
"service_settings": {
"api_key": "JinaAI-Api-key",
"model_id": "jina-reranker-v2-base-multilingual"
},
"task_settings": {
"top_n": 10,
"return_documents": true
}
}
{
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v4",
"api_key": "JinaAi-Api-key"
}
}
{
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"api_key": "JinaAi-Api-key",
"multimodal_model": false
}
}
{
"inference_id": "jinaai-embeddings",
"task_type": "text_embedding",
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"rate_limit": {
"requests_per_minute": 2000
},
"dimensions": 1024,
"embedding_type": "float",
"similarity": "dot_product"
},
"chunking_settings": {
"strategy": "sentence",
"max_chunk_size": 250,
"sentence_overlap": 1
}
}
{
"inference_id": "jinaai-rerank",
"task_type": "rerank",
"service": "jinaai",
"service_settings": {
"model_id": "jina-reranker-v2-base-multilingual",
"rate_limit": {
"requests_per_minute": 2000
}
},
"task_settings": {
"top_n": 10,
"return_documents": true
}
}
{
"inference_id": "jinaai-embeddings-multimodal",
"task_type": "embedding",
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v4",
"rate_limit": {
"requests_per_minute": 2000
},
"dimensions": 2048,
"embedding_type": "float",
"similarity": "dot_product",
"multimodal_model": true
},
"chunking_settings": {
"strategy": "sentence",
"max_chunk_size": 250,
"sentence_overlap": 1
}
}
{
"inference_id": "jinaai-embeddings-text-only",
"task_type": "embedding",
"service": "jinaai",
"service_settings": {
"model_id": "jina-embeddings-v3",
"rate_limit": {
"requests_per_minute": 2000
},
"dimensions": 1024,
"embedding_type": "float",
"similarity": "dot_product",
"multimodal_model": false
},
"chunking_settings": {
"strategy": "sentence",
"max_chunk_size": 250,
"sentence_overlap": 1
}
}