We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 72af259 commit dead8f4 Copy full SHA for dead8f4
ggml-cuda.cu
@@ -1433,7 +1433,9 @@ static __device__ __forceinline__ float vec_dot_q5_1_q8_1(
1433
const block_q5_1 * bq5_1 = (const block_q5_1 *) vbq;
1434
1435
// TODO: fix misaligned access
1436
- const int qs = *((int *) &bq5_1->qs[sizeof(int) * (iqs + 0)]);
+ int qs;
1437
+ memcpy(&qs, &bq5_1->qs[sizeof(int) * (iqs + 0)], sizeof(qs));
1438
+ //const int qs = *((int *) &bq5_1->qs[sizeof(int) * (iqs + 0)]);
1439
const int qh0 = bq5_1->qh[iqs/2 + 0] >> 4*(iqs%2);
1440
const int qh1 = bq5_1->qh[iqs/2 + 2] >> 4*(iqs%2);
1441
const int ui0 = *((int *) &bq8_1->qs[sizeof(int) * (iqs + 0)]);
0 commit comments