examples : utilize new llama_get_logits_ith()

This commit is contained in:
Georgi Gerganov 2023-09-28 16:05:37 +03:00
parent 4c72ab13b2
commit d008733e6b
No known key found for this signature in database
GPG Key ID: 449E073F9DC10735
3 changed files with 3 additions and 3 deletions

View File

@@ -905,7 +905,7 @@ llama_token llama_sample_token(
llama_token id = 0;
- float * logits = llama_get_logits(ctx) + idx * n_vocab;
+ float * logits = llama_get_logits_ith(ctx, idx);
// Apply params.logit_bias map
for (auto it = params.logit_bias.begin(); it != params.logit_bias.end(); it++) {

View File

@@ -183,7 +183,7 @@ std::string llama_detokenize_bpe(
// - ctx_guidance: context to use for classifier-free guidance, ignore if NULL
// - grammar: grammar to use for sampling, ignore if NULL
// - last_tokens: needed for repetition penalty, ignore if empty
- // - idx: sample from llama_get_logits(ctx) + idx * n_vocab
+ // - idx: sample from llama_get_logits_ith(ctx, idx)
//
// returns:
// - token: sampled token

View File

@@ -150,7 +150,7 @@ int main(int argc, char ** argv) {
}
auto n_vocab = llama_n_vocab(ctx);
- auto logits = llama_get_logits(ctx) + i_batch[i] * n_vocab;
+ auto logits = llama_get_logits_ith(ctx, i_batch[i]);
std::vector<llama_token_data> candidates;
candidates.reserve(n_vocab);