We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent f774690, commit 0f3f883 (copy full SHA for 0f3f883)
1 file changed
llama_cpp/llama.py
@@ -1040,7 +1040,8 @@ def embed(
1040
1041
# get pooling information
1042
pooling_type = self.pooling_type()
1043
- logits_all = pooling_type == llama_cpp.LLAMA_POOLING_TYPE_NONE
+ # All tokens need outputs for embeddings; llama.cpp otherwise logs an "overriding" warning per input.
1044
+ logits_all = True
1045
1046
if self.context_params.embeddings is False:
1047
raise RuntimeError(
0 commit comments