The type of the inference task that the model will perform.
Values are rerank, text_embedding, completion, or chat_completion.
The unique identifier of the inference endpoint.
Specifies the amount of time to wait for the inference endpoint to be created.
The chunking configuration object.
Applies only to the text_embedding task type.
Not applicable to the rerank, completion, or chat_completion task types.
The type of service supported for the specified task type. In this case, it is googlevertexai.
Value is googlevertexai.
Settings used to install the inference model. These settings are specific to the googlevertexai service.
Settings to configure the inference task. These settings are specific to the task type you specified.
PUT _inference/text_embedding/google_vertex_ai_embeddings
{
"service": "googlevertexai",
"service_settings": {
"service_account_json": "service-account-json",
"model_id": "model-id",
"location": "location",
"project_id": "project-id"
}
}
resp = client.inference.put(
task_type="text_embedding",
inference_id="google_vertex_ai_embeddings",
inference_config={
"service": "googlevertexai",
"service_settings": {
"service_account_json": "service-account-json",
"model_id": "model-id",
"location": "location",
"project_id": "project-id"
}
},
)
const response = await client.inference.put({
task_type: "text_embedding",
inference_id: "google_vertex_ai_embeddings",
inference_config: {
service: "googlevertexai",
service_settings: {
service_account_json: "service-account-json",
model_id: "model-id",
location: "location",
project_id: "project-id",
},
},
});
response = client.inference.put(
task_type: "text_embedding",
inference_id: "google_vertex_ai_embeddings",
body: {
"service": "googlevertexai",
"service_settings": {
"service_account_json": "service-account-json",
"model_id": "model-id",
"location": "location",
"project_id": "project-id"
}
}
)
$resp = $client->inference()->put([
"task_type" => "text_embedding",
"inference_id" => "google_vertex_ai_embeddings",
"body" => [
"service" => "googlevertexai",
"service_settings" => [
"service_account_json" => "service-account-json",
"model_id" => "model-id",
"location" => "location",
"project_id" => "project-id",
],
],
]);
curl -X PUT -H "Authorization: ApiKey $ELASTIC_API_KEY" -H "Content-Type: application/json" -d '{"service":"googlevertexai","service_settings":{"service_account_json":"service-account-json","model_id":"model-id","location":"location","project_id":"project-id"}}' "$ELASTICSEARCH_URL/_inference/text_embedding/google_vertex_ai_embeddings"
client.inference().put(p -> p
.inferenceId("google_vertex_ai_embeddings")
.taskType(TaskType.TextEmbedding)
.inferenceConfig(i -> i
.service("googlevertexai")
.serviceSettings(JsonData.fromJson("{\"service_account_json\":\"service-account-json\",\"model_id\":\"model-id\",\"location\":\"location\",\"project_id\":\"project-id\"}"))
)
);
{
"service": "googlevertexai",
"service_settings": {
"service_account_json": "service-account-json",
"model_id": "model-id",
"location": "location",
"project_id": "project-id"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "meta",
"service_account_json": "service-account-json",
"streaming_url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/%ENDPOINT_ID%/chat/completions"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "hugging_face",
"service_account_json": "service-account-json",
"url": "https://%ENDPOINT_ID%.%LOCATION_ID%-%PROJECT_ID%.prediction.vertexai.goog/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/%ENDPOINT_ID%/chat/completions"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "hugging_face",
"service_account_json": "service-account-json",
"streaming_url": "https://%ENDPOINT_ID%.%LOCATION_ID%-%PROJECT_ID%.prediction.vertexai.goog/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/%ENDPOINT_ID%/chat/completions"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "hugging_face",
"service_account_json": "service-account-json",
"url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/%ENDPOINT_ID%/chat/completions"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "hugging_face",
"service_account_json": "service-account-json",
"streaming_url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/%ENDPOINT_ID%/chat/completions"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "mistral",
"model_id": "mistral-small-2503",
"service_account_json": "service-account-json",
"url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/publishers/mistralai/models/%MODEL_ID%:rawPredict",
"streaming_url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/publishers/mistralai/models/%MODEL_ID%:streamRawPredict"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "mistral",
"model_id": "mistral-small-2503",
"service_account_json": "service-account-json",
"streaming_url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/publishers/mistralai/models/%MODEL_ID%:streamRawPredict"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "mistral",
"service_account_json": "service-account-json",
"url": "https://%ENDPOINT_ID%.%LOCATION_ID%-%PROJECT_ID%.prediction.vertexai.goog/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/%ENDPOINT_ID%/chat/completions"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "mistral",
"service_account_json": "service-account-json",
"streaming_url": "https://%ENDPOINT_ID%.%LOCATION_ID%-%PROJECT_ID%.prediction.vertexai.goog/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/%ENDPOINT_ID%/chat/completions"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "mistral",
"service_account_json": "service-account-json",
"url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/%ENDPOINT_ID%/chat/completions"
}
}
{
"service": "googlevertexai",
"service_settings": {
"service_account_json": "service-account-json",
"project_id": "project-id"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "mistral",
"service_account_json": "service-account-json",
"streaming_url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/%ENDPOINT_ID%/chat/completions"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "ai21",
"service_account_json": "service-account-json",
"url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/publishers/ai21/models/%MODEL_ID%:rawPredict",
"streaming_url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/publishers/ai21/models/%MODEL_ID%:streamRawPredict"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "ai21",
"service_account_json": "service-account-json",
"streaming_url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/publishers/ai21/models/%MODEL_ID%:streamRawPredict"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "anthropic",
"service_account_json": "service-account-json",
"url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/publishers/anthropic/models/%MODEL_ID%:rawPredict",
"streaming_url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/publishers/anthropic/models/%MODEL_ID%:streamRawPredict"
},
"task_settings": {
"max_tokens": 128
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "anthropic",
"service_account_json": "service-account-json",
"streaming_url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/publishers/anthropic/models/%MODEL_ID%:streamRawPredict"
},
"task_settings": {
"max_tokens": 128
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "meta",
"model_id": "meta/llama-3.3-70b-instruct-maas",
"service_account_json": "service-account-json",
"url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/openapi/chat/completions"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "meta",
"model_id": "meta/llama-3.3-70b-instruct-maas",
"service_account_json": "service-account-json",
"streaming_url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/openapi/chat/completions"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "meta",
"service_account_json": "service-account-json",
"url": "https://%ENDPOINT_ID%.%LOCATION_ID%-fasttryout.prediction.vertexai.goog/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/%ENDPOINT_ID%/chat/completions"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "meta",
"service_account_json": "service-account-json",
"streaming_url": "https://%ENDPOINT_ID%.%LOCATION_ID%-fasttryout.prediction.vertexai.goog/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/%ENDPOINT_ID%/chat/completions"
}
}
{
"service": "googlevertexai",
"service_settings": {
"provider": "meta",
"service_account_json": "service-account-json",
"url": "https://%LOCATION_ID%-aiplatform.googleapis.com/v1/projects/%PROJECT_ID%/locations/%LOCATION_ID%/endpoints/%ENDPOINT_ID%/chat/completions"
}
}