Safetensors
English
llama
File size: 422 Bytes
52ed9af
f3d9037
 
52ed9af
f3d9037
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
# Inference config for CALM-8B.
#
# Usage:
#   oumi infer -i -c ./oumi_infer.yaml
#

# Model loading settings.
model:
  model_name: "uiuc-convai/CALM-8B"
  adapter_model: null  # Update for LoRA-tuned models.
  model_max_length: 2048  # Update based on your hardware constraints.
  torch_dtype_str: "bfloat16"
  attn_implementation: "sdpa"
  # Booleans are written in canonical lowercase so that YAML 1.1 and
  # YAML 1.2 loaders agree on their type.
  load_pretrained_weights: true
  # NOTE(review): presumably permits running custom code shipped with the
  # model repository; confirm this is actually required for this model.
  trust_remote_code: true

# Text generation settings.
generation:
  # NOTE(review): same value as model.model_max_length; confirm that the
  # prompt plus generated tokens still fits within that limit.
  max_new_tokens: 2048

# Inference backend selection.
engine: NATIVE