bdubayah baseten-admin committed on
Commit
daf5a4b
·
verified ·
1 Parent(s): 2ee0e77

Update hf_quant_config.json (#2)

Browse files

- Update hf_quant_config.json (7f7fd49789974079affecf5eaa06d6308250e930)


Co-authored-by: Baseten Admin <[email protected]>

Files changed (1) hide show
  1. hf_quant_config.json +1 -1
hf_quant_config.json CHANGED
@@ -5,7 +5,7 @@
5
  },
6
  "quantization": {
7
  "quant_algo": "NVFP4",
8
- "kv_cache_quant_algo": "FP8",
9
  "group_size": 16,
10
  "exclude_modules": [
11
  "lm_head",
 
5
  },
6
  "quantization": {
7
  "quant_algo": "NVFP4",
8
+ "kv_cache_quant_algo": null,
9
  "group_size": 16,
10
  "exclude_modules": [
11
  "lm_head",