Use convert_ids_to_tokens instead of decode in logits endpoint

This preserves the space information in Llama tokenizer tokens, which is lost when each token id is passed through decode individually.
2024-10-01 01:26:03 -04:00 · 2023-11-19 09:22:08 -08:00 · 2023-11-19 09:22:08 -08:00 · a2e6d00128
commit a2e6d00128
parent 8cf05c1b31
1 changed file with 4 additions and 1 deletion
--- a/modules/logits.py
+++ b/modules/logits.py
@@ -55,7 +55,10 @@ def get_next_logits(prompt, state, use_samplers, previous, return_dict=False):
    if is_non_hf_exllamav1 or is_non_hf_llamacpp:
        topk_indices = [i.expand((1, 1)) for i in topk_indices]

-    tokens = [shared.tokenizer.decode(i) for i in topk_indices]
+    if hasattr(shared.tokenizer, 'convert_ids_to_tokens'):
+        tokens = [shared.tokenizer.convert_ids_to_tokens(int(i)) for i in topk_indices]
+    else:
+        tokens = [shared.tokenizer.decode(i) for i in topk_indices]

    if return_dict:
        output = {}