Patch for the GPTQModifier entry of the qwen2_5vl_w8a8_int8 quantization recipe:
replaces the explicit `weights` block (num_bits: 8, type: int) with the single
setting `scheme: W8A8`. The targets and ignore lists are untouched context.

NOTE(review): this patch was recovered from a copy whose line breaks and leading
whitespace had been collapsed. The YAML indentation in the hunk below is
reconstructed assuming 2-space nesting with GPTQModifier two levels deep --
confirm against the target file before applying.
NOTE(review): both the old and the new version of the file end without a
trailing newline; this patch keeps it that way.

diff --git a/olmocr/train/quantization_configs/qwen2_5vl_w8a8_int8.yaml b/olmocr/train/quantization_configs/qwen2_5vl_w8a8_int8.yaml
index 763b726..302b1f0 100644
--- a/olmocr/train/quantization_configs/qwen2_5vl_w8a8_int8.yaml
+++ b/olmocr/train/quantization_configs/qwen2_5vl_w8a8_int8.yaml
@@ -3,6 +3,4 @@ quantization_stage:
     GPTQModifier:
       targets: [Linear]
       ignore: ['re:.*lm_head', 're:model.visual.*']
-      weights:
-        num_bits: 8
-        type: int
\ No newline at end of file
+      scheme: W8A8
\ No newline at end of file