---
# Model definition for the "llama-3.1" entry, served through the
# `transformers` backend.
#
# NOTE(review): this file was previously collapsed onto a single line, which
# is not parseable YAML. The nesting below was reconstructed from the key
# order; `context_size` and `type` are assumed to be top-level keys rather
# than children of `parameters` -- confirm against the consumer's schema.

# Identifier for this model entry.
name: llama-3.1

# Backend that loads and runs the model.
backend: transformers

parameters:
  # Model reference; presumably a Hugging Face Hub repo id -- TODO confirm.
  model: fakezeta/Meta-Llama-3.1-8B-Instruct-ov-int8

# Context window size; presumably measured in tokens -- TODO confirm.
context_size: 8192

# Loader class name; the "OV" prefix suggests an OpenVINO model class
# (Optimum Intel) -- verify against the backend's supported types.
type: OVModelForCausalLM

template:
  # Presumably tells the backend to use the chat template bundled with the
  # model's tokenizer instead of a template defined here -- TODO confirm.
  use_tokenizer_template: true