Update README.md
Browse files
README.md
CHANGED
@@ -1,6 +1,11 @@
|
|
1 |
```
|
|
|
|
|
|
|
2 |
dynamic = {
|
3 |
# `.*\.` matches the layers_node prefix
|
|
|
|
|
4 |
r".*\.(?:1[0-5])\..*": {"bits": 8,}, # match layer 10-15
|
5 |
r".*\.(?:1[6-9]|20|21)\..*": {"bits": 8, "group_size": 64,}, # match layer 16-21
|
6 |
}
|
|
|
1 |
```
|
2 |
+
# The TinyLlama 1.1B model has 22 layers.
|
3 |
+
# Layer indices start at 0, so the valid range is 0-21.
|
4 |
+
|
5 |
dynamic = {
|
6 |
# `.*\.` matches the layers_node prefix
|
7 |
+
# Roughly the last 1/2 of the layers (10-21) use 8-bit, versus 4-bit for layers 0-9.
|
8 |
+
# Roughly the last 1/4 of the layers (16-21) use 8-bit with group_size 64.
|
9 |
r".*\.(?:1[0-5])\..*": {"bits": 8,}, # match layer 10-15
|
10 |
r".*\.(?:1[6-9]|20|21)\..*": {"bits": 8, "group_size": 64,}, # match layer 16-21
|
11 |
}
|