Update README.md
Browse files
README.md
CHANGED
|
@@ -90,8 +90,8 @@ In the `convert.py` file of mlx-lm on your system ( [you can see the original co
|
|
| 90 |
q_bits = 3
|
| 91 |
if "switch_mlp.down_proj" in path:
|
| 92 |
q_bits = 3
|
| 93 |
-
# Blocks
|
| 94 |
-
if
|
| 95 |
q_bits = 6
|
| 96 |
# Every 5th block is "medium" quality
|
| 97 |
if (index % 5) == 0:
|
|
@@ -105,8 +105,8 @@ Should you wish to squeeze more out of your quant, and you do not need to use a
|
|
| 105 |
```python
|
| 106 |
if "switch_mlp.down_proj" in path:
|
| 107 |
q_bits = 4
|
| 108 |
-
# Blocks
|
| 109 |
-
if
|
| 110 |
q_bits = 6
|
| 111 |
#print("path:", path, "index:", index, "q_bits:", q_bits)
|
| 112 |
return {"group_size": group_size, "bits": q_bits}
|
|
|
|
| 90 |
q_bits = 3
|
| 91 |
if "switch_mlp.down_proj" in path:
|
| 92 |
q_bits = 3
|
| 93 |
+
# The first 5 blocks (index < 5) are higher quality
|
| 94 |
+
if index < 5:
|
| 95 |
q_bits = 6
|
| 96 |
# Every 5th block is "medium" quality
|
| 97 |
if (index % 5) == 0:
|
|
|
|
| 105 |
```python
|
| 106 |
if "switch_mlp.down_proj" in path:
|
| 107 |
q_bits = 4
|
| 108 |
+
# The first 5 blocks (index < 5) are higher quality
|
| 109 |
+
if index < 5:
|
| 110 |
q_bits = 6
|
| 111 |
#print("path:", path, "index:", index, "q_bits:", q_bits)
|
| 112 |
return {"group_size": group_size, "bits": q_bits}
|