tomkay's picture
RAM 170GB mixed-precision quantization of Llama-4-Maverick
d61370a verified
Raw
History Blame Contribute Delete
375 Bytes
{
"backend": "tokenizers",
"bos_token": "<|begin_of_text|>",
"clean_up_tokenization_spaces": false,
"eos_token": "<|eot|>",
"is_local": true,
"model_input_names": [
"input_ids",
"attention_mask"
],
"model_max_length": 1048576,
"pad_token": "<|finetune_right_pad|>",
"processor_class": "Llama4Processor",
"tokenizer_class": "TokenizersBackend"
}