Perform dense embedding inference on the service
POST /_inference/embedding/{inference_id}
Parameters
Path Parameters
| Name | Type |
|---|---|
| `inference_id` (required): The inference ID. | type TypesId = string |
Query Parameters
| Name | Type |
|---|---|
| `timeout`: Specifies the amount of time to wait for the inference request to complete. | type TypesDuration = string \| "-1" \| "0" |
Request Body
application/json
required
/**
 * JSON request body for the dense embedding inference endpoint
 * (`POST /_inference/embedding/{inference_id}`).
 *
 * Only `input` is mandatory; the remaining properties may be omitted.
 */
interface InferenceTypesRequestEmbedding {
  /** The input to run embedding inference on. */
  input: InferenceTypesEmbeddingInput;
  /**
   * Optional string describing the input.
   * NOTE(review): the accepted values are not listed here — confirm against the service documentation.
   */
  input_type?: string;
  /** Optional task settings supplied with this request. */
  task_settings?: InferenceTypesTaskSettings;
}
input:
input_type?: string;
task_settings?:
}
Responses
200 application/json
/**
 * JSON payload of the 200 response from the dense embedding inference endpoint.
 *
 * Every property is optional.
 * NOTE(review): presumably only the property matching the service's embedding
 * element type is populated — confirm against the API reference.
 */
interface InferenceTypesEmbeddingInferenceResult {
  /** Embedding results expressed with the byte result type. */
  embeddings_bytes?: Array<InferenceTypesDenseEmbeddingByteResult>;
  /** Bit embedding results; declared with the same byte result type as `embeddings_bytes`. */
  embeddings_bits?: Array<InferenceTypesDenseEmbeddingByteResult>;
  /** Dense embedding results. */
  embeddings?: Array<InferenceTypesDenseEmbeddingResult>;
}
embeddings_bytes?:
embeddings_bits?:
embeddings?:
}