Qubitium committed on
Commit
1808ab5
·
verified ·
1 Parent(s): 79a4bea

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +5 -0
README.md CHANGED
@@ -1,6 +1,11 @@
1
  ```
 
 
 
2
  dynamic = {
3
  # `.*\.` matches the layers_node prefix
 
 
4
  r".*\.(?:1[0-5])\..*": {"bits": 8,}, # match layer 10-15
5
  r".*\.(?:1[6-9]|20|21)\..*": {"bits": 8, "group_size": 64,}, # match layer 16-21
6
  }
 
1
  ```
2
+ # the TinyLlama 1.1B model has 22 layers
3
+ # layer indices start at 0
4
+
5
  dynamic = {
6
  # `.*\.` matches the layers_node prefix
7
+ # the last half of the layers (10-21) use 8-bit, versus 4-bit for layers 0-9
8
+ # the last quarter of the layers (16-21) use 8-bit with group_size 64
9
  r".*\.(?:1[0-5])\..*": {"bits": 8,}, # match layer 10-15
10
  r".*\.(?:1[6-9]|20|21)\..*": {"bits": 8, "group_size": 64,}, # match layer 16-21
11
  }