Update ggml/src/ggml-cuda/dmmv.cu
Co-authored-by: Johannes Gäßler <johannesg@5d6.de>
This commit is contained in:
parent
d07dc44c63
commit
d150c7e309
1 changed file with 1 addition and 4 deletions
|
@@ -480,10 +480,7 @@ static __global__ void dequantize_mul_mat_vec(const void * __restrict__ vx, cons
|
||||||
if ( y_offset == 1 ) {
|
if ( y_offset == 1 ) {
|
||||||
// load 2 dfloats into register in a single instruction
|
// load 2 dfloats into register in a single instruction
|
||||||
const dfloat2 y_reg = *((dfloat2 *) &(y[iybs + iqs + j/qr]));
|
const dfloat2 y_reg = *((dfloat2 *) &(y[iybs + iqs + j/qr]));
|
||||||
tmp += __hmul2(v, {
|
tmp += __hmul2(v, y_reg);
|
||||||
y_reg.x;
|
|
||||||
y_reg.y;
|
|
||||||
});
|
|
||||||
}
|
}
|
||||||
else {
|
else {
|
||||||
tmp += __hmul2(v, {
|
tmp += __hmul2(v, {
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue