metal : disable fast-math for some cpy kernels (#14460)
* metal : disable fast-math for some cpy kernels
  ggml-ci
* cont : disable for q4_1
  ggml-ci
* cont : disable for iq4_nl
  ggml-ci
This commit is contained in:
parent
a7417f5594
commit
5dd942de59
|
@ -138,6 +138,7 @@ void quantize_q4_0(device const float * src, device block_q4_0 & dst) {
|
||||||
}
|
}
|
||||||
|
|
||||||
void quantize_q4_1(device const float * src, device block_q4_1 & dst) {
|
void quantize_q4_1(device const float * src, device block_q4_1 & dst) {
|
||||||
|
#pragma METAL fp math_mode(safe)
|
||||||
float min = FLT_MAX;
|
float min = FLT_MAX;
|
||||||
float max = -FLT_MAX;
|
float max = -FLT_MAX;
|
||||||
|
|
||||||
|
@ -203,6 +204,7 @@ void quantize_q5_0(device const float * src, device block_q5_0 & dst) {
|
||||||
}
|
}
|
||||||
|
|
||||||
void quantize_q5_1(device const float * src, device block_q5_1 & dst) {
|
void quantize_q5_1(device const float * src, device block_q5_1 & dst) {
|
||||||
|
#pragma METAL fp math_mode(safe)
|
||||||
float max = src[0];
|
float max = src[0];
|
||||||
float min = src[0];
|
float min = src[0];
|
||||||
|
|
||||||
|
@ -239,6 +241,7 @@ void quantize_q5_1(device const float * src, device block_q5_1 & dst) {
|
||||||
}
|
}
|
||||||
|
|
||||||
void quantize_iq4_nl(device const float * src, device block_iq4_nl & dst) {
|
void quantize_iq4_nl(device const float * src, device block_iq4_nl & dst) {
|
||||||
|
#pragma METAL fp math_mode(safe)
|
||||||
float amax = 0.0f; // absolute max
|
float amax = 0.0f; // absolute max
|
||||||
float max = 0.0f;
|
float max = 0.0f;
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue