Add support for logit_bias outside of server api. Closes #827 · aniljava/llama-cpp-python@07e47f5 · GitHub
Skip to content

Commit 07e47f5

Browse files
committed
Add support for logit_bias outside of server api. Closes abetlen#827
1 parent c21edb6 commit 07e47f5

3 files changed

Lines changed: 44 additions & 38 deletions

File tree

llama_cpp/llama.py

Lines changed: 25 additions & 0 deletions

llama_cpp/llama_chat_format.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -45,6 +45,7 @@ def __call__(
45 45
model: Optional[str] = None,
46 46
logits_processor: Optional[llama.LogitsProcessorList] = None,
47 47
grammar: Optional[llama.LlamaGrammar] = None,
48 +
logit_bias: Optional[Dict[str, float]] = None,
48 49
**kwargs, # type: ignore
49 50
) -> Union[
50 51
llama_types.CreateChatCompletionResponse,
@@ -308,6 +309,7 @@ def basic_create_chat_completion(
308 309
model: Optional[str] = None,
309 310
logits_processor: Optional[llama.LogitsProcessorList] = None,
310 311
grammar: Optional[llama.LlamaGrammar] = None,
312 +
logit_bias: Optional[Dict[str, float]] = None,
311 313
**kwargs, # type: ignore
312 314
) -> Union[
313 315
llama_types.CreateChatCompletionResponse,
@@ -350,6 +352,7 @@ def basic_create_chat_completion(
350 352
model=model,
351 353
logits_processor=logits_processor,
352 354
grammar=grammar,
355 +
logit_bias=logit_bias,
353 356
)
354 357
return _convert_completion_to_chat(completion_or_chunks, stream=stream)
355 358

llama_cpp/server/app.py

Lines changed: 16 additions & 38 deletions

0 commit comments

Comments
 (0)