dual-lm-470m / tokenizer_config.json
davda54's picture
Upload 6 files
3af89f7 verified
{
  "tokenizer_class": "PreTrainedTokenizerFast",
  "bos_token": "<s>",
  "eos_token": "</s>",
  "unk_token": "<unk>",
  "pad_token": "<pad>",
  "mask_token": "<mask>",
  "model_max_length": 2048,
  "clean_up_tokenization_spaces": false,
  "added_tokens_decoder": {
    "0": {
      "content": "<unk>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "1": {
      "content": "<s>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "2": {
      "content": "</s>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "3": {
      "content": "<pad>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "4": {
      "content": "<mask>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "5": {
      "content": "<special_0>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "6": {
      "content": "<special_1>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "7": {
      "content": "<special_2>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "8": {
      "content": "<special_3>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "9": {
      "content": "<special_4>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "10": {
      "content": "<special_5>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "11": {
      "content": "<special_6>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "12": {
      "content": "<special_7>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "13": {
      "content": "<special_8>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "14": {
      "content": "<special_9>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "15": {
      "content": "<special_10>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    }
  }
}