@@ -658,7 +658,7 @@ def sample(
658658 min_p : float = 0.05 ,
659659 typical_p : float = 1.0 ,
660660 temp : float = 0.80 ,
661- repeat_penalty : float = 1.1 ,
661+ repeat_penalty : float = 1.0 ,
662662 frequency_penalty : float = 0.0 ,
663663 presence_penalty : float = 0.0 ,
664664 tfs_z : float = 1.0 ,
@@ -733,7 +733,7 @@ def generate(
733733 min_p : float = 0.05 ,
734734 typical_p : float = 1.0 ,
735735 temp : float = 0.80 ,
736- repeat_penalty : float = 1.1 ,
736+ repeat_penalty : float = 1.0 ,
737737 reset : bool = True ,
738738 frequency_penalty : float = 0.0 ,
739739 presence_penalty : float = 0.0 ,
@@ -751,7 +751,7 @@ def generate(
751751 Examples:
752752 >>> llama = Llama("models/ggml-7b.bin")
753753 >>> tokens = llama.tokenize(b"Hello, world!")
754- >>> for token in llama.generate(tokens, top_k=40, top_p=0.95, temp=1.0, repeat_penalty=1.1 ):
754+ >>> for token in llama.generate(tokens, top_k=40, top_p=0.95, temp=1.0, repeat_penalty=1.0 ):
755755 ... print(llama.detokenize([token]))
756756
757757 Args:
@@ -1020,7 +1020,7 @@ def _create_completion(
10201020 stop : Optional [Union [str , List [str ]]] = [],
10211021 frequency_penalty : float = 0.0 ,
10221022 presence_penalty : float = 0.0 ,
1023- repeat_penalty : float = 1.1 ,
1023+ repeat_penalty : float = 1.0 ,
10241024 top_k : int = 40 ,
10251025 stream : bool = False ,
10261026 seed : Optional [int ] = None ,
@@ -1639,7 +1639,7 @@ def create_completion(
16391639 stop : Optional [Union [str , List [str ]]] = [],
16401640 frequency_penalty : float = 0.0 ,
16411641 presence_penalty : float = 0.0 ,
1642- repeat_penalty : float = 1.1 ,
1642+ repeat_penalty : float = 1.0 ,
16431643 top_k : int = 40 ,
16441644 stream : bool = False ,
16451645 seed : Optional [int ] = None ,
@@ -1736,7 +1736,7 @@ def __call__(
17361736 stop : Optional [Union [str , List [str ]]] = [],
17371737 frequency_penalty : float = 0.0 ,
17381738 presence_penalty : float = 0.0 ,
1739- repeat_penalty : float = 1.1 ,
1739+ repeat_penalty : float = 1.0 ,
17401740 top_k : int = 40 ,
17411741 stream : bool = False ,
17421742 seed : Optional [int ] = None ,
@@ -1833,7 +1833,7 @@ def create_chat_completion(
18331833 max_tokens : Optional [int ] = None ,
18341834 presence_penalty : float = 0.0 ,
18351835 frequency_penalty : float = 0.0 ,
1836- repeat_penalty : float = 1.1 ,
1836+ repeat_penalty : float = 1.0 ,
18371837 tfs_z : float = 1.0 ,
18381838 mirostat_mode : int = 0 ,
18391839 mirostat_tau : float = 5.0 ,
0 commit comments