From cf1459ff75e3eca2989b852a3b887974fc86d817 Mon Sep 17 00:00:00 2001
From: Giuseppe Franco
Date: Fri, 10 Jan 2025 15:30:12 +0000
Subject: [PATCH] error out if sdpa func is not compatible

When args.functional_sdpa_quant is set, validate() now fails early unless
input activations use dynamic scaling (args.input_scale_type == 'dynamic')
or no input bit width is configured (args.input_bit_width is None).

The condition is written so that it agrees with the assertion message:
the check passes for dynamic activation quantization and fails otherwise.

---
 src/brevitas_examples/llm/main.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/src/brevitas_examples/llm/main.py b/src/brevitas_examples/llm/main.py
index ec93f14bb..61f6565ed 100644
--- a/src/brevitas_examples/llm/main.py
+++ b/src/brevitas_examples/llm/main.py
@@ -133,6 +133,8 @@ def model_export(model, ref_input, args):
 
 
 def validate(args):
+    if args.functional_sdpa_quant:
+        assert args.input_scale_type == 'dynamic' or args.input_bit_width is None, "Functional SDPA Quant requires dynamic activation quantization"
     if args.rotation == 'fx':
         assert args.ln_affine_merge, 'Graph rotation requires to merge LN/RMS norm affine parameters'
         assert args.replace_rmsnorm, 'Graph rotation requires to replace HF RMSNorm with PyTorch ones (torch 2.4+ require)'