mirror of
https://github.com/ggerganov/whisper.cpp.git
synced 2025-05-01 14:44:33 +02:00
llamafile: use member variable instead of constant for iq4nlt (llama/11780)
This commit is contained in:
parent
4e07957bf9
commit
defe731263
@ -280,14 +280,6 @@ template <> inline __m256bh load(const float *p) {
|
|||||||
}
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
////////////////////////////////////////////////////////////////////////////////////////////////////
|
|
||||||
// CONSTANTS
|
|
||||||
|
|
||||||
#if defined(__AVX__) || defined(__AVX2__) || defined(__AVX512F__)
|
|
||||||
static const int8_t kvalues_iq4nl[16] = {-127, -104, -83, -65, -49, -35, -22, -10, 1, 13, 25, 38, 53, 69, 89, 113};
|
|
||||||
static const __m128i iq4nlt = _mm_loadu_si128((const __m128i *) kvalues_iq4nl);
|
|
||||||
#endif
|
|
||||||
|
|
||||||
////////////////////////////////////////////////////////////////////////////////////////////////////
|
////////////////////////////////////////////////////////////////////////////////////////////////////
|
||||||
// FLOATING POINT MATRIX MULTIPLICATION
|
// FLOATING POINT MATRIX MULTIPLICATION
|
||||||
|
|
||||||
@ -614,6 +606,14 @@ class tinyBLAS_Q0_AVX {
|
|||||||
TC *C, int64_t ldc,
|
TC *C, int64_t ldc,
|
||||||
int ith, int nth)
|
int ith, int nth)
|
||||||
: A(A), B(B), C(C), k(k), lda(lda), ldb(ldb), ldc(ldc), ith(ith), nth(nth) {
|
: A(A), B(B), C(C), k(k), lda(lda), ldb(ldb), ldc(ldc), ith(ith), nth(nth) {
|
||||||
|
const int8_t kvalues_iq4nl[16] = {
|
||||||
|
-127, -104, -83, -65,
|
||||||
|
-49, -35, -22, -10,
|
||||||
|
1, 13, 25, 38,
|
||||||
|
53, 69, 89, 113
|
||||||
|
};
|
||||||
|
|
||||||
|
iq4nlt = _mm_loadu_si128((const __m128i *)kvalues_iq4nl);
|
||||||
}
|
}
|
||||||
|
|
||||||
void matmul(int64_t m, int64_t n) {
|
void matmul(int64_t m, int64_t n) {
|
||||||
@ -1038,6 +1038,7 @@ class tinyBLAS_Q0_AVX {
|
|||||||
const int64_t ldc;
|
const int64_t ldc;
|
||||||
const int ith;
|
const int ith;
|
||||||
const int nth;
|
const int nth;
|
||||||
|
__m128i iq4nlt;
|
||||||
};
|
};
|
||||||
#endif // __AVX__
|
#endif // __AVX__
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user