Create a Cohere inference endpoint (Generally available; added in 8.13.0)
Path parameters
- `task_type`: The type of the inference task that the model will perform. Values are `completion`, `rerank`, or `text_embedding`.
- `cohere_inference_id`: The unique identifier of the inference endpoint.
PUT /_inference/{task_type}/{cohere_inference_id}
Console
PUT _inference/text_embedding/cohere-embeddings { "service": "cohere", "service_settings": { "api_key": "Cohere-Api-key", "model_id": "embed-english-light-v3.0", "embedding_type": "byte" } }
resp = client.inference.put( task_type="text_embedding", inference_id="cohere-embeddings", inference_config={ "service": "cohere", "service_settings": { "api_key": "Cohere-Api-key", "model_id": "embed-english-light-v3.0", "embedding_type": "byte" } }, )
const response = await client.inference.put({ task_type: "text_embedding", inference_id: "cohere-embeddings", inference_config: { service: "cohere", service_settings: { api_key: "Cohere-Api-key", model_id: "embed-english-light-v3.0", embedding_type: "byte", }, }, });
response = client.inference.put( task_type: "text_embedding", inference_id: "cohere-embeddings", body: { "service": "cohere", "service_settings": { "api_key": "Cohere-Api-key", "model_id": "embed-english-light-v3.0", "embedding_type": "byte" } } )
$resp = $client->inference()->put([ "task_type" => "text_embedding", "inference_id" => "cohere-embeddings", "body" => [ "service" => "cohere", "service_settings" => [ "api_key" => "Cohere-Api-key", "model_id" => "embed-english-light-v3.0", "embedding_type" => "byte", ], ], ]);
curl -X PUT -H "Authorization: ApiKey $ELASTIC_API_KEY" -H "Content-Type: application/json" -d '{"service":"cohere","service_settings":{"api_key":"Cohere-Api-key","model_id":"embed-english-light-v3.0","embedding_type":"byte"}}' "$ELASTICSEARCH_URL/_inference/text_embedding/cohere-embeddings"
client.inference().put(p -> p .inferenceId("cohere-embeddings") .taskType(TaskType.TextEmbedding) .inferenceConfig(i -> i .service("cohere") .serviceSettings(JsonData.fromJson("{\"api_key\":\"Cohere-Api-key\",\"model_id\":\"embed-english-light-v3.0\",\"embedding_type\":\"byte\"}")) ) );
Request examples
A text embedding task
Run `PUT _inference/text_embedding/cohere-embeddings` to create an inference endpoint that performs a text embedding task.
{ "service": "cohere", "service_settings": { "api_key": "Cohere-Api-key", "model_id": "embed-english-light-v3.0", "embedding_type": "byte" } }
A rerank task
Run `PUT _inference/rerank/cohere-rerank` to create an inference endpoint that performs a rerank task.
{ "service": "cohere", "service_settings": { "api_key": "Cohere-API-key", "model_id": "rerank-english-v3.0" }, "task_settings": { "top_n": 10, "return_documents": true } }