diff options
| author | Konstantin <const@const.me> | 2023-01-23 17:44:18 +0100 |
|---|---|---|
| committer | Konstantin <const@const.me> | 2023-01-23 17:44:18 +0100 |
| commit | 39c834d571f8ba1dc35483266dda275382c96a1c (patch) | |
| tree | 2ed4ffbada39f2d303fda2ac2b5d53e843fadce0 | |
| parent | 01325d7168669f8d05446314f8b53c62e7de3af9 (diff) | |
Minor, performance and VRAM use
| -rw-r--r-- | Whisper/Whisper/WhisperContext.cpp | 5 |
1 files changed, 2 insertions, 3 deletions
```diff
diff --git a/Whisper/Whisper/WhisperContext.cpp b/Whisper/Whisper/WhisperContext.cpp
index 823d207..9e62766 100644
--- a/Whisper/Whisper/WhisperContext.cpp
+++ b/Whisper/Whisper/WhisperContext.cpp
@@ -478,11 +478,10 @@ Tensor WhisperContext::decodeLayer( const Tensor& inpL, size_t il, const sLayerD
 	{
 		profiler.setNextTag( "dec.layer.6" );
 		cur = mulMat( layer.attnLn1.w, cur );
-		addRepeat( cur, layer.attnLn1.b );
 	}
 
-	// add the input
-	Tensor inpCA = add( cur, inpL );
+	addRepeatEx( cur, layer.attnLn1.b, inpL );
+	Tensor inpCA = cur;
 
 	// norm
 	{
```
