From 16e223fbca02350c6b966b2389530e8557d8a8d7 Mon Sep 17 00:00:00 2001 From: Vulcan <93451215+trholding@users.noreply.github.com> Date: Sat, 20 Jul 2024 19:20:30 +0530 Subject: [PATCH] Update runq.c runq - Undo #pragma omp parallel sections for matmuls for now, as there is no real benefit with a low number of cores --- runq.c | 9 --------- 1 file changed, 9 deletions(-) diff --git a/runq.c b/runq.c index e4ea34a9..1a32da00 100644 --- a/runq.c +++ b/runq.c @@ -636,18 +636,9 @@ float* forward(Transformer* transformer, int token, int pos) { // qkv matmuls for this position quantize(&s->xq, s->xb, dim); - -// L2E Addition - #pragma omp parallel sections - { - #pragma omp section matmul(s->q, &s->xq, w->wq + l, dim, dim); - #pragma omp section matmul(s->k, &s->xq, w->wk + l, dim, kv_dim); - #pragma omp section matmul(s->v, &s->xq, w->wv + l, dim, kv_dim); - } -// END L2E Addition // RoPE relative positional encoding: complex-valued rotate q and k in each head for (int i = 0; i < dim; i+=2) {