@@ -658,7 +658,7 @@ def sample(
658
658
min_p : float = 0.05 ,
659
659
typical_p : float = 1.0 ,
660
660
temp : float = 0.80 ,
661
- repeat_penalty : float = 1.1 ,
661
+ repeat_penalty : float = 1.0 ,
662
662
frequency_penalty : float = 0.0 ,
663
663
presence_penalty : float = 0.0 ,
664
664
tfs_z : float = 1.0 ,
@@ -733,7 +733,7 @@ def generate(
733
733
min_p : float = 0.05 ,
734
734
typical_p : float = 1.0 ,
735
735
temp : float = 0.80 ,
736
- repeat_penalty : float = 1.1 ,
736
+ repeat_penalty : float = 1.0 ,
737
737
reset : bool = True ,
738
738
frequency_penalty : float = 0.0 ,
739
739
presence_penalty : float = 0.0 ,
@@ -751,7 +751,7 @@ def generate(
751
751
Examples:
752
752
>>> llama = Llama("models/ggml-7b.bin")
753
753
>>> tokens = llama.tokenize(b"Hello, world!")
754
- >>> for token in llama.generate(tokens, top_k=40, top_p=0.95, temp=1.0, repeat_penalty=1.1 ):
754
+ >>> for token in llama.generate(tokens, top_k=40, top_p=0.95, temp=1.0, repeat_penalty=1.0 ):
755
755
... print(llama.detokenize([token]))
756
756
757
757
Args:
@@ -1020,7 +1020,7 @@ def _create_completion(
1020
1020
stop : Optional [Union [str , List [str ]]] = [],
1021
1021
frequency_penalty : float = 0.0 ,
1022
1022
presence_penalty : float = 0.0 ,
1023
- repeat_penalty : float = 1.1 ,
1023
+ repeat_penalty : float = 1.0 ,
1024
1024
top_k : int = 40 ,
1025
1025
stream : bool = False ,
1026
1026
seed : Optional [int ] = None ,
@@ -1639,7 +1639,7 @@ def create_completion(
1639
1639
stop : Optional [Union [str , List [str ]]] = [],
1640
1640
frequency_penalty : float = 0.0 ,
1641
1641
presence_penalty : float = 0.0 ,
1642
- repeat_penalty : float = 1.1 ,
1642
+ repeat_penalty : float = 1.0 ,
1643
1643
top_k : int = 40 ,
1644
1644
stream : bool = False ,
1645
1645
seed : Optional [int ] = None ,
@@ -1736,7 +1736,7 @@ def __call__(
1736
1736
stop : Optional [Union [str , List [str ]]] = [],
1737
1737
frequency_penalty : float = 0.0 ,
1738
1738
presence_penalty : float = 0.0 ,
1739
- repeat_penalty : float = 1.1 ,
1739
+ repeat_penalty : float = 1.0 ,
1740
1740
top_k : int = 40 ,
1741
1741
stream : bool = False ,
1742
1742
seed : Optional [int ] = None ,
@@ -1833,7 +1833,7 @@ def create_chat_completion(
1833
1833
max_tokens : Optional [int ] = None ,
1834
1834
presence_penalty : float = 0.0 ,
1835
1835
frequency_penalty : float = 0.0 ,
1836
- repeat_penalty : float = 1.1 ,
1836
+ repeat_penalty : float = 1.0 ,
1837
1837
tfs_z : float = 1.0 ,
1838
1838
mirostat_mode : int = 0 ,
1839
1839
mirostat_tau : float = 5.0 ,
0 commit comments