Skip to content

Commit 95559fa

Browse files
author
zdl010
committed
Upgrade llama.cpp to b3265, support gemma2, remove beam parameter [ggml-org/llama.cpp#7985]
1 parent fffa31b commit 95559fa

File tree

4 files changed

+2
-12
lines changed

4 files changed

+2
-12
lines changed

CMakeLists.txt

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -24,7 +24,7 @@ FetchContent_MakeAvailable(json)
2424
FetchContent_Declare(
2525
llama.cpp
2626
GIT_REPOSITORY https://github.com/ggerganov/llama.cpp.git
27-
GIT_TAG b3008
27+
GIT_TAG b3265
2828
)
2929
FetchContent_MakeAvailable(llama.cpp)
3030

pom.xml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,7 @@
44

55
<groupId>de.kherud</groupId>
66
<artifactId>llama</artifactId>
7-
<version>3.2.1</version>
7+
<version>3.2.2</version>
88
<packaging>jar</packaging>
99

1010
<name>${project.groupId}:${project.artifactId}</name>

src/main/cpp/server.hpp

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2551,7 +2551,6 @@ static void server_params_parse(json jparams, server_params &sparams, gpt_params
25512551
params.n_parallel = json_value(jparams, "n_parallel", default_params.n_parallel);
25522552
params.n_sequences = json_value(jparams, "n_sequences", default_params.n_sequences);
25532553
params.p_split = json_value(jparams, "p_split", default_params.p_split);
2554-
params.n_beams = json_value(jparams, "n_beams", default_params.n_beams);
25552554
params.grp_attn_n = json_value(jparams, "grp_attn_n", default_params.grp_attn_n);
25562555
params.grp_attn_w = json_value(jparams, "grp_attn_w", default_params.grp_attn_w);
25572556
params.n_print = json_value(jparams, "n_print", default_params.n_print);

src/main/java/de/kherud/llama/ModelParameters.java

Lines changed: 0 additions & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -32,7 +32,6 @@ public final class ModelParameters extends JsonParameters {
3232
private static final String PARAM_SPLIT_MODE = "split_mode";
3333
private static final String PARAM_MAIN_GPU = "main_gpu";
3434
private static final String PARAM_TENSOR_SPLIT = "tensor_split";
35-
private static final String PARAM_N_BEAMS = "n_beams";
3635
private static final String PARAM_GRP_ATTN_N = "grp_attn_n";
3736
private static final String PARAM_GRP_ATTN_W = "grp_attn_w";
3837
private static final String PARAM_ROPE_FREQ_BASE = "rope_freq_base";
@@ -244,14 +243,6 @@ public ModelParameters setTensorSplit(float[] tensorSplit) {
244243
return this;
245244
}
246245

247-
/**
248-
* Set usage of beam search of given width if non-zero.
249-
*/
250-
public ModelParameters setNBeams(int nBeams) {
251-
parameters.put(PARAM_N_BEAMS, String.valueOf(nBeams));
252-
return this;
253-
}
254-
255246
/**
256247
* Set the group-attention factor (default: 1)
257248
*/

0 commit comments

Comments
 (0)