linzhao-amd committed on
Commit
aef98c2
·
verified ·
1 Parent(s): 464058f

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -56,7 +56,7 @@ python3 quantize_quark.py --model_dir "${MODEL}" \
56
  --model_export hf_format \
57
  --custom_mode fp8 \
58
  --quant_algo autosmoothquant \
59
- --exclude_layers "lm_head" "*.gate"
60
  ```
61
 
62
  # Model Performance Comparison
 
56
  --model_export hf_format \
57
  --custom_mode fp8 \
58
  --quant_algo autosmoothquant \
59
+ --exclude_layers "lm_head" "*.gate" "*.o_proj"
60
  ```
61
 
62
  # Model Performance Comparison