mirror of
https://github.com/elastic/elasticsearch.git
synced 2025-06-29 01:44:36 -04:00
[DOCS] Fixes adaptive_allocations examples (#113248)
Co-authored-by: Jan Kuipers <148754765+jan-elastic@users.noreply.github.com>
This commit is contained in:
parent
1b2b202ef7
commit
9b7d808bf4
3 changed files with 10 additions and 2 deletions
|
@@ -179,6 +179,7 @@ PUT _inference/text_embedding/my-e5-model
|
|||
"min_number_of_allocations": 3,
|
||||
"max_number_of_allocations": 10
|
||||
},
|
||||
"num_threads": 1,
|
||||
"model_id": ".multilingual-e5-small"
|
||||
}
|
||||
}
|
||||
|
|
|
@@ -147,7 +147,8 @@ PUT _inference/sparse_embedding/my-elser-model
|
|||
"enabled": true,
|
||||
"min_number_of_allocations": 3,
|
||||
"max_number_of_allocations": 10
|
||||
}
|
||||
},
|
||||
"num_threads": 1
|
||||
}
|
||||
}
|
||||
------------------------------------------------------------
|
||||
|
|
|
@@ -36,7 +36,11 @@ PUT _inference/sparse_embedding/my-elser-endpoint <1>
|
|||
{
|
||||
"service": "elser", <2>
|
||||
"service_settings": {
|
||||
"num_allocations": 1,
|
||||
"adaptive_allocations": { <3>
|
||||
"enabled": true,
|
||||
"min_number_of_allocations": 3,
|
||||
"max_number_of_allocations": 10
|
||||
},
|
||||
"num_threads": 1
|
||||
}
|
||||
}
|
||||
|
@@ -46,6 +50,8 @@ PUT _inference/sparse_embedding/my-elser-endpoint <1>
|
|||
be used and ELSER creates sparse vectors. The `inference_id` is
|
||||
`my-elser-endpoint`.
|
||||
<2> The `elser` service is used in this example.
|
||||
<3> This setting enables and configures {ml-docs}/ml-nlp-elser.html#elser-adaptive-allocations[adaptive allocations].
|
||||
Adaptive allocations make it possible for ELSER to automatically scale resources up or down based on the current load on the process.
|
||||
|
||||
[NOTE]
|
||||
====
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue