Upload folder using huggingface_hub
Browse files- quant_strategy.json +3 -3
quant_strategy.json
CHANGED
|
@@ -601,7 +601,7 @@
|
|
| 601 |
},
|
| 602 |
"q_proj": {
|
| 603 |
"group_size": {
|
| 604 |
-
"
|
| 605 |
},
|
| 606 |
"bits": [
|
| 607 |
4
|
|
@@ -614,7 +614,7 @@
|
|
| 614 |
},
|
| 615 |
"k_proj": {
|
| 616 |
"group_size": {
|
| 617 |
-
"
|
| 618 |
},
|
| 619 |
"bits": [
|
| 620 |
4
|
|
@@ -696,7 +696,7 @@
|
|
| 696 |
},
|
| 697 |
"q_proj": {
|
| 698 |
"group_size": {
|
| 699 |
-
"
|
| 700 |
},
|
| 701 |
"bits": [
|
| 702 |
4
|
|
|
|
| 601 |
},
|
| 602 |
"q_proj": {
|
| 603 |
"group_size": {
|
| 604 |
+
"4": 128
|
| 605 |
},
|
| 606 |
"bits": [
|
| 607 |
4
|
|
|
|
| 614 |
},
|
| 615 |
"k_proj": {
|
| 616 |
"group_size": {
|
| 617 |
+
"4": 128
|
| 618 |
},
|
| 619 |
"bits": [
|
| 620 |
4
|
|
|
|
| 696 |
},
|
| 697 |
"q_proj": {
|
| 698 |
"group_size": {
|
| 699 |
+
"4": 128
|
| 700 |
},
|
| 701 |
"bits": [
|
| 702 |
4
|