mirror of
https://github.com/khoaliber/khoj.git
synced 2026-03-07 13:23:15 +00:00
Add max prompt size for gpt-3.5-turbo-16k
This commit is contained in:
@@ -14,7 +14,12 @@ import queue
|
|||||||
from khoj.utils.helpers import merge_dicts
|
from khoj.utils.helpers import merge_dicts
|
||||||
|
|
||||||
logger = logging.getLogger(__name__)
|
logger = logging.getLogger(__name__)
|
||||||
max_prompt_size = {"gpt-3.5-turbo": 4096, "gpt-4": 8192, "llama-2-7b-chat.ggmlv3.q4_K_S.bin": 1548}
|
max_prompt_size = {
|
||||||
|
"gpt-3.5-turbo": 4096,
|
||||||
|
"gpt-4": 8192,
|
||||||
|
"llama-2-7b-chat.ggmlv3.q4_K_S.bin": 1548,
|
||||||
|
"gpt-3.5-turbo-16k": 15000,
|
||||||
|
}
|
||||||
tokenizer = {"llama-2-7b-chat.ggmlv3.q4_K_S.bin": "hf-internal-testing/llama-tokenizer"}
|
tokenizer = {"llama-2-7b-chat.ggmlv3.q4_K_S.bin": "hf-internal-testing/llama-tokenizer"}
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user