Merge pull request #43 from krzysztof-jusiak/rmsnorm

Speed up rmsnorm by using sqrtf/expf
This commit is contained in:
Andrej
2023-07-24 14:13:49 -07:00
committed by GitHub
+2 -2
View File
@@ -184,7 +184,7 @@ void rmsnorm(float* o, float* x, float* weight, int size) {
}
ss /= size;
ss += 1e-5f;
-ss = 1.0f / sqrt(ss);
+ss = 1.0f / sqrtf(ss);
// normalize and scale
for (int j = 0; j < size; j++) {
o[j] = weight[j] * (ss * x[j]);
@@ -202,7 +202,7 @@ void softmax(float* x, int size) {
// exp and sum
float sum = 0.0f;
for (int i = 0; i < size; i++) {
-x[i] = exp(x[i] - max_val);
+x[i] = expf(x[i] - max_val);
sum += x[i];
}
// normalize