You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboard. Expand all lines: llama_cpp/llama.py
-17
Original file line number
Diff line number
Diff line change
@@ -677,7 +677,6 @@ def _init_sampler(
677
677
repeat_penalty: float=1.0,
678
678
frequency_penalty: float=0.0,
679
679
presence_penalty: float=0.0,
680
-
tfs_z: float=1.0,
681
680
mirostat_mode: int=0,
682
681
mirostat_eta: float=0.1,
683
682
mirostat_tau: float=5.0,
@@ -771,7 +770,6 @@ def sample(
771
770
repeat_penalty: float=1.0,
772
771
frequency_penalty: float=0.0,
773
772
presence_penalty: float=0.0,
774
-
tfs_z: float=1.0,
775
773
mirostat_mode: int=0,
776
774
mirostat_eta: float=0.1,
777
775
mirostat_tau: float=5.0,
@@ -809,7 +807,6 @@ def sample(
809
807
repeat_penalty=repeat_penalty,
810
808
frequency_penalty=frequency_penalty,
811
809
presence_penalty=presence_penalty,
812
-
tfs_z=tfs_z,
813
810
mirostat_mode=mirostat_mode,
814
811
mirostat_tau=mirostat_tau,
815
812
mirostat_eta=mirostat_eta,
@@ -841,7 +838,6 @@ def generate(
841
838
reset: bool=True,
842
839
frequency_penalty: float=0.0,
843
840
presence_penalty: float=0.0,
844
-
tfs_z: float=1.0,
845
841
mirostat_mode: int=0,
846
842
mirostat_tau: float=5.0,
847
843
mirostat_eta: float=0.1,
@@ -883,7 +879,6 @@ def generate(
883
879
repeat_penalty=repeat_penalty,
884
880
frequency_penalty=frequency_penalty,
885
881
presence_penalty=presence_penalty,
886
-
tfs_z=tfs_z,
887
882
mirostat_mode=mirostat_mode,
888
883
mirostat_tau=mirostat_tau,
889
884
mirostat_eta=mirostat_eta,
@@ -938,7 +933,6 @@ def generate(
938
933
repeat_penalty=repeat_penalty,
939
934
frequency_penalty=frequency_penalty,
940
935
presence_penalty=presence_penalty,
941
-
tfs_z=tfs_z,
942
936
mirostat_mode=mirostat_mode,
943
937
mirostat_tau=mirostat_tau,
944
938
mirostat_eta=mirostat_eta,
@@ -1157,7 +1151,6 @@ def _create_completion(
1157
1151
top_n_sigma: float=-1.00,
1158
1152
stream: bool=False,
1159
1153
seed: Optional[int] =None,
1160
-
tfs_z: float=1.0,
1161
1154
mirostat_mode: int=0,
1162
1155
mirostat_tau: float=5.0,
1163
1156
mirostat_eta: float=0.1,
@@ -1348,7 +1341,6 @@ def logit_bias_processor(
1348
1341
min_p=min_p,
1349
1342
typical_p=typical_p,
1350
1343
temp=temperature,
1351
-
tfs_z=tfs_z,
1352
1344
mirostat_mode=mirostat_mode,
1353
1345
mirostat_tau=mirostat_tau,
1354
1346
mirostat_eta=mirostat_eta,
@@ -1783,7 +1775,6 @@ def create_completion(
1783
1775
top_n_sigma: float=-1.00,
1784
1776
stream: bool=False,
1785
1777
seed: Optional[int] =None,
1786
-
tfs_z: float=1.0,
1787
1778
mirostat_mode: int=0,
1788
1779
mirostat_tau: float=5.0,
1789
1780
mirostat_eta: float=0.1,
@@ -1815,7 +1806,6 @@ def create_completion(
1815
1806
top_n_sigma: Limit the next token selection to a subset of tokens with pre-softmax logits that are within n * σ less than the max logit (default: -1.00, -1.00 = disabled).
1816
1807
stream: Whether to stream the results.
1817
1808
seed: The seed to use for sampling.
1818
-
tfs_z: The tail-free sampling parameter. Tail Free Sampling described in https://www.trentonbricken.com/Tail-Free-Sampling/.
1819
1809
mirostat_mode: The mirostat sampling mode.
1820
1810
mirostat_tau: The target cross-entropy (or surprise) value you want to achieve for the generated text. A higher value corresponds to more surprising or less predictable text, while a lower value corresponds to less surprising or more predictable text.
1821
1811
mirostat_eta: The learning rate used to update `mu` based on the error between the target and observed surprisal of the sampled word. A larger learning rate will cause `mu` to be updated more quickly, while a smaller learning rate will result in slower updates.
@@ -1852,7 +1842,6 @@ def create_completion(
1852
1842
top_n_sigma=top_n_sigma,
1853
1843
stream=stream,
1854
1844
seed=seed,
1855
-
tfs_z=tfs_z,
1856
1845
mirostat_mode=mirostat_mode,
1857
1846
mirostat_tau=mirostat_tau,
1858
1847
mirostat_eta=mirostat_eta,
@@ -1889,7 +1878,6 @@ def __call__(
1889
1878
top_n_sigma: float=-1.00,
1890
1879
stream: bool=False,
1891
1880
seed: Optional[int] =None,
1892
-
tfs_z: float=1.0,
1893
1881
mirostat_mode: int=0,
1894
1882
mirostat_tau: float=5.0,
1895
1883
mirostat_eta: float=0.1,
@@ -1921,7 +1909,6 @@ def __call__(
1921
1909
top_n_sigma: Limit the next token selection to a subset of tokens with pre-softmax logits that are within n * σ less than the max logit (default: -1.00, -1.00 = disabled).
1922
1910
stream: Whether to stream the results.
1923
1911
seed: The seed to use for sampling.
1924
-
tfs_z: The tail-free sampling parameter. Tail Free Sampling described in https://www.trentonbricken.com/Tail-Free-Sampling/.
1925
1912
mirostat_mode: The mirostat sampling mode.
1926
1913
mirostat_tau: The target cross-entropy (or surprise) value you want to achieve for the generated text. A higher value corresponds to more surprising or less predictable text, while a lower value corresponds to less surprising or more predictable text.
1927
1914
mirostat_eta: The learning rate used to update `mu` based on the error between the target and observed surprisal of the sampled word. A larger learning rate will cause `mu` to be updated more quickly, while a smaller learning rate will result in slower updates.
@@ -1958,7 +1945,6 @@ def __call__(
1958
1945
top_n_sigma=top_n_sigma,
1959
1946
stream=stream,
1960
1947
seed=seed,
1961
-
tfs_z=tfs_z,
1962
1948
mirostat_mode=mirostat_mode,
1963
1949
mirostat_tau=mirostat_tau,
1964
1950
mirostat_eta=mirostat_eta,
@@ -1992,7 +1978,6 @@ def create_chat_completion(
1992
1978
presence_penalty: float=0.0,
1993
1979
frequency_penalty: float=0.0,
1994
1980
repeat_penalty: float=1.0,
1995
-
tfs_z: float=1.0,
1996
1981
mirostat_mode: int=0,
1997
1982
mirostat_tau: float=5.0,
1998
1983
mirostat_eta: float=0.1,
@@ -2029,7 +2014,6 @@ def create_chat_completion(
2029
2014
presence_penalty: The penalty to apply to tokens based on their presence in the prompt.
2030
2015
frequency_penalty: The penalty to apply to tokens based on their frequency in the prompt.
2031
2016
repeat_penalty: The penalty to apply to repeated tokens.
2032
-
tfs_z: The tail-free sampling parameter.
2033
2017
mirostat_mode: The mirostat sampling mode.
2034
2018
mirostat_tau: The mirostat sampling tau parameter.
2035
2019
mirostat_eta: The mirostat sampling eta parameter.
0 commit comments