mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-28 12:24:35 +00:00
constants.py : add token types
This commit is contained in:
parent
7ec125b1dc
commit
5d518d421f
@ -38,6 +38,7 @@ KEY_ROPE_SCALE = "{llm}.rope.scale"
|
|||||||
# tokenization
|
# tokenization
|
||||||
KEY_TOKENIZER_MODEL = "tokenizer.ggml.model"
|
KEY_TOKENIZER_MODEL = "tokenizer.ggml.model"
|
||||||
KEY_TOKENIZER_LIST = "tokenizer.ggml.tokens"
|
KEY_TOKENIZER_LIST = "tokenizer.ggml.tokens"
|
||||||
|
KEY_TOKENIZER_TOKEN_TYPE = "tokenizer.ggml.token_type"
|
||||||
KEY_TOKENIZER_SCORES = "tokenizer.ggml.scores"
|
KEY_TOKENIZER_SCORES = "tokenizer.ggml.scores"
|
||||||
KEY_TOKENIZER_MERGES = "tokenizer.ggml.merges"
|
KEY_TOKENIZER_MERGES = "tokenizer.ggml.merges"
|
||||||
KEY_TOKENIZER_BOS_ID = "tokenizer.ggml.bos_token_id"
|
KEY_TOKENIZER_BOS_ID = "tokenizer.ggml.bos_token_id"
|
||||||
@ -47,8 +48,3 @@ KEY_TOKENIZER_SEP_ID = "tokenizer.ggml.seperator_token_id"
|
|||||||
KEY_TOKENIZER_PAD_ID = "tokenizer.ggml.padding_token_id"
|
KEY_TOKENIZER_PAD_ID = "tokenizer.ggml.padding_token_id"
|
||||||
KEY_TOKENIZER_HF_JSON = "tokenizer.huggingface.json"
|
KEY_TOKENIZER_HF_JSON = "tokenizer.huggingface.json"
|
||||||
KEY_TOKENIZER_RWKV = "tokenizer.rwkv.world"
|
KEY_TOKENIZER_RWKV = "tokenizer.rwkv.world"
|
||||||
KEY_TOKENIZER_BOS_ID = "tokenizer.ggml.bos_token_id"
|
|
||||||
KEY_TOKENIZER_EOS_ID = "tokenizer.ggml.eos_token_id"
|
|
||||||
KEY_TOKENIZER_UNK_ID = "tokenizer.ggml.unknown_token_id"
|
|
||||||
KEY_TOKENIZER_SEP_ID = "tokenizer.ggml.separator_token_id"
|
|
||||||
KEY_TOKENIZER_PAD_ID = "tokenizer.ggml.padding_token_id"
|
|
||||||
|
Loading…
Reference in New Issue
Block a user