Add max prompt size for gpt-3.5-turbo-16k

This commit is contained in:
sabaimran 2023-09-26 10:57:35 -07:00
parent 99f9c3f8e2
commit 588f35b6e9

View file

@ -14,7 +14,12 @@ import queue
from khoj.utils.helpers import merge_dicts
# Module-level logger, named after the importing module via __name__.
logger = logging.getLogger(__name__)
# Single-line form of the model-name -> max prompt size mapping.
# NOTE(review): the multi-line assignment that follows rebinds this same name,
# so this line looks like the pre-change side of the diff — confirm.
max_prompt_size = {"gpt-3.5-turbo": 4096, "gpt-4": 8192, "llama-2-7b-chat.ggmlv3.q4_K_S.bin": 1548}
# Maximum prompt size per model, keyed by model name.
# NOTE(review): units are presumably tokens — confirm against the code that
# reads this mapping.
max_prompt_size = {
    "gpt-3.5-turbo": 4096,
    "gpt-4": 8192,
    "llama-2-7b-chat.ggmlv3.q4_K_S.bin": 1548,
    "gpt-3.5-turbo-16k": 15000,
}
# Maps a model name to the tokenizer identifier to use for it.
# NOTE(review): the value is presumably a Hugging Face tokenizer repo id, and
# models absent from this mapping presumably use a default chosen elsewhere —
# confirm against the code that reads it.
tokenizer = {"llama-2-7b-chat.ggmlv3.q4_K_S.bin": "hf-internal-testing/llama-tokenizer"}