@@ -141,20 +141,6 @@ typedef sycl::half2 ggml_half2;
141
141
142
142
#endif // GGML_COMMON_DECL_CUDA || GGML_COMMON_DECL_HIP
143
143
144
- // 1.625 bpw for BitNet b1.58 models: 13 bytes (12 + 1) hold one block of QK1_3 = 64 elements (104 bits / 64)
145
- #define QK1_3 64 // number of elements covered by one block_q1_3
146
- typedef struct {
147
- uint8_t q[(QK1_3 - 4 *QK1_3/64 )/5 ]; // 12 bytes, 5 elements per byte (3^5 = 243 < 256) -> 60 of the 64 elements
148
- uint8_t qs[QK1_3/64 ]; // 1 byte, 4 elements per byte -> the remaining 4 elements
149
- } block_q1_3;
150
- static_assert (sizeof (block_q1_3) == (QK1_3 - 4 *QK1_3/64 )/5 + QK1_3/64, "wrong q1_3 block size/padding"); // 12 + 1 = 13 bytes, i.e. no padding allowed
151
-
152
- #define QK2_2 32 // presumably the number of elements per block_q2_2 -- confirm against the (de)quantization code
153
- typedef struct {
154
- uint8_t qs[QK2_2 / 4 ]; // packed quants, 8 bytes; NOTE(review): QK2_2 / 4 bytes implies 4 elements (2 bits each) per byte rather than nibbles -- confirm
155
- } block_q2_2;
156
- static_assert (sizeof (block_q2_2) == QK2_2 / 4, "wrong q2_2 block size/padding"); // struct must be exactly 8 bytes, i.e. no padding allowed
157
-
158
144
#define QK4_0 32 // presumably the number of elements per q4_0 block -- the struct using it is only partly visible here, confirm
159
145
typedef struct {
160
146
ggml_half d; // delta
@@ -1084,41 +1070,6 @@ GGML_TABLE_BEGIN(uint32_t, iq3s_grid, 512)
1084
1070
0x0f090307 , 0x0f090501 , 0x0f090b01 , 0x0f0b0505 , 0x0f0b0905 , 0x0f0d0105 , 0x0f0d0703 , 0x0f0f0101 ,
1085
1071
GGML_TABLE_END ()
1086
1072
1087
- GGML_TABLE_BEGIN (uint32_t , q1_3_grid, 256 ) // 256 entries (32 rows of 8); every byte of every entry is 0xff, 0x00 or 0x01 (presumably int8 -1/0/+1 -- confirm); some adjacent entries repeat, e.g. the first two
1088
- 0xffffffff , 0xffffffff , 0xffffff00 , 0xffffff01 , 0xffff00ff , 0xffff0000 , 0xffff0001 , 0xffff01ff ,
1089
- 0xffff0100 , 0xffff0101 , 0xff00ffff , 0xff00ff00 , 0xff00ff01 , 0xff0000ff , 0xff000000 , 0xff000001 ,
1090
- 0xff0001ff , 0xff000100 , 0xff000101 , 0xff01ffff , 0xff01ffff , 0xff01ff00 , 0xff01ff01 , 0xff0100ff ,
1091
- 0xff010000 , 0xff010001 , 0xff0101ff , 0xff010100 , 0xff010101 , 0x00ffffff , 0x00ffff00 , 0x00ffff01 ,
1092
- 0x00ff00ff , 0x00ff0000 , 0x00ff0001 , 0x00ff01ff , 0x00ff0100 , 0x00ff0101 , 0x0000ffff , 0x0000ff00 ,
1093
- 0x0000ff00 , 0x0000ff01 , 0x000000ff , 0x00000000 , 0x00000001 , 0x000001ff , 0x00000100 , 0x00000101 ,
1094
- 0x0001ffff , 0x0001ff00 , 0x0001ff01 , 0x000100ff , 0x00010000 , 0x00010001 , 0x000101ff , 0x00010100 ,
1095
- 0x00010101 , 0x01ffffff , 0x01ffff00 , 0x01ffff01 , 0x01ffff01 , 0x01ff00ff , 0x01ff0000 , 0x01ff0001 ,
1096
- 0x01ff01ff , 0x01ff0100 , 0x01ff0101 , 0x0100ffff , 0x0100ff00 , 0x0100ff01 , 0x010000ff , 0x01000000 ,
1097
- 0x01000001 , 0x010001ff , 0x01000100 , 0x01000101 , 0x0101ffff , 0x0101ff00 , 0x0101ff01 , 0x0101ff01 ,
1098
- 0x010100ff , 0x01010000 , 0x01010001 , 0x010101ff , 0x01010100 , 0x01010101 , 0xffffffff , 0xffffff00 ,
1099
- 0xffffff01 , 0xffff00ff , 0xffff0000 , 0xffff0001 , 0xffff01ff , 0xffff0100 , 0xffff0101 , 0xff00ffff ,
1100
- 0xff00ff00 , 0xff00ff01 , 0xff0000ff , 0xff0000ff , 0xff000000 , 0xff000001 , 0xff0001ff , 0xff000100 ,
1101
- 0xff000101 , 0xff01ffff , 0xff01ff00 , 0xff01ff01 , 0xff0100ff , 0xff010000 , 0xff010001 , 0xff0101ff ,
1102
- 0xff010100 , 0xff010101 , 0x00ffffff , 0x00ffff00 , 0x00ffff01 , 0x00ff00ff , 0x00ff0000 , 0x00ff0000 ,
1103
- 0x00ff0001 , 0x00ff01ff , 0x00ff0100 , 0x00ff0101 , 0x0000ffff , 0x0000ff00 , 0x0000ff01 , 0x000000ff ,
1104
- 0x00000000 , 0x00000001 , 0x000001ff , 0x00000100 , 0x00000101 , 0x0001ffff , 0x0001ff00 , 0x0001ff01 ,
1105
- 0x000100ff , 0x00010000 , 0x00010000 , 0x00010001 , 0x000101ff , 0x00010100 , 0x00010101 , 0x01ffffff ,
1106
- 0x01ffff00 , 0x01ffff01 , 0x01ff00ff , 0x01ff0000 , 0x01ff0001 , 0x01ff01ff , 0x01ff0100 , 0x01ff0101 ,
1107
- 0x0100ffff , 0x0100ff00 , 0x0100ff01 , 0x010000ff , 0x01000000 , 0x01000001 , 0x01000001 , 0x010001ff ,
1108
- 0x01000100 , 0x01000101 , 0x0101ffff , 0x0101ff00 , 0x0101ff01 , 0x010100ff , 0x01010000 , 0x01010001 ,
1109
- 0x010101ff , 0x01010100 , 0x01010101 , 0xffffffff , 0xffffff00 , 0xffffff01 , 0xffff00ff , 0xffff0000 ,
1110
- 0xffff0001 , 0xffff01ff , 0xffff01ff , 0xffff0100 , 0xffff0101 , 0xff00ffff , 0xff00ff00 , 0xff00ff01 ,
1111
- 0xff0000ff , 0xff000000 , 0xff000001 , 0xff0001ff , 0xff000100 , 0xff000101 , 0xff01ffff , 0xff01ff00 ,
1112
- 0xff01ff01 , 0xff0100ff , 0xff010000 , 0xff010001 , 0xff0101ff , 0xff0101ff , 0xff010100 , 0xff010101 ,
1113
- 0x00ffffff , 0x00ffff00 , 0x00ffff01 , 0x00ff00ff , 0x00ff0000 , 0x00ff0001 , 0x00ff01ff , 0x00ff0100 ,
1114
- 0x00ff0101 , 0x0000ffff , 0x0000ff00 , 0x0000ff01 , 0x000000ff , 0x00000000 , 0x00000001 , 0x000001ff ,
1115
- 0x00000100 , 0x00000100 , 0x00000101 , 0x0001ffff , 0x0001ff00 , 0x0001ff01 , 0x000100ff , 0x00010000 ,
1116
- 0x00010001 , 0x000101ff , 0x00010100 , 0x00010101 , 0x01ffffff , 0x01ffff00 , 0x01ffff01 , 0x01ff00ff ,
1117
- 0x01ff0000 , 0x01ff0001 , 0x01ff01ff , 0x01ff0100 , 0x01ff0101 , 0x01ff0101 , 0x0100ffff , 0x0100ff00 ,
1118
- 0x0100ff01 , 0x010000ff , 0x01000000 , 0x01000001 , 0x010001ff , 0x01000100 , 0x01000101 , 0x0101ffff ,
1119
- 0x0101ff00 , 0x0101ff01 , 0x010100ff , 0x01010000 , 0x01010001 , 0x010101ff , 0x01010100 , 0x01010101 ,
1120
- GGML_TABLE_END ()
1121
-
1122
1073
#define NGRID_IQ1S 2048 // presumably the entry count of the IQ1_S grid table -- confirm against the table definition
1123
1074
#define IQ1S_DELTA 0.125f // single float literal (1/8); must stay one token so the macro is usable inside expressions
1124
1075
#define IQ1M_DELTA 0.125f // single float literal (1/8); must stay one token so the macro is usable inside expressions
0 commit comments