Skip to content

Commit ffc7272

Browse files
authored
sampling : make top_n_sigma no-op at <=0 or a single candidate (#13345)
1 parent 91a86a6 commit ffc7272

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

src/llama-sampling.cpp

+1 -1
Original file line number | Diff line number | Diff line change
@@ -1750,7 +1750,7 @@ static const char * llama_sampler_top_n_sigma_name(const struct llama_sampler *
17501750
static void llama_sampler_top_n_sigma_apply(struct llama_sampler * smpl, llama_token_data_array * cur_p) {
17511751
const auto * ctx = (llama_sampler_top_n_sigma *) smpl->ctx;
17521752

1753-
if (ctx->n < 0.0f) {
1753+
if (ctx->n <= 0.0f || cur_p->size <= 1) {
17541754
return;
17551755
}
17561756

tests/test-sampling.cpp

+1 -1
Original file line number | Diff line number | Diff line change
@@ -360,7 +360,7 @@ int main(void) {
360360
test_dry({0.2f, 0.2f, 0.2f, 0.2f, 0.2f}, {0, 1, 2, 3, 4, 0, 1}, {0.2f, 0.2f, 0.2f, 0.2f, 0.2f}, 1.0f, 1.1f, 4, 7, {});
361361

362362
test_top_n_sigma({0.1f, 0.2f, 0.3f, 0.4f}, {0.571429f, 0.428571f, 0.0f, 0.0f}, 1.00f);
363-
test_top_n_sigma({0.1f, 0.2f, 0.3f, 0.4f}, {1.0f, 0.0f, 0.0f, 0.0f}, 0.00f);
363+
test_top_n_sigma({0.1f, 0.2f, 0.3f, 0.4f}, {0.4f, 0.3f, 0.2f, 0.1f}, 0.00f); // top_n_sigma == 0 now represents a no-op rather than greedy decoding as of PR#13345
364364
test_top_n_sigma({0.1f, 0.2f, 0.3f, 0.4f}, {0.4f, 0.3f, 0.2f, 0.1f}, 3.00f);
365365

366366
test_sampler_queue(10000, "k", 10000, 1.0f, 1.0f);

0 commit comments

Comments
 (0)