diff --git a/include/private/dsp/arch/x86/avx512/msmatrix.h b/include/private/dsp/arch/x86/avx512/msmatrix.h index 002fdd96..cfb1be5c 100644 --- a/include/private/dsp/arch/x86/avx512/msmatrix.h +++ b/include/private/dsp/arch/x86/avx512/msmatrix.h @@ -273,8 +273,8 @@ namespace lsp ARCH_X86_ASM( __ASM_EMIT("xor %[off], %[off]") // 64x blocks - __ASM_EMIT32("subl $32, %[count]") - __ASM_EMIT64("sub $32, %[count]") + __ASM_EMIT32("subl $64, %[count]") + __ASM_EMIT64("sub $64, %[count]") __ASM_EMIT("jb 2f") __ASM_EMIT("1:") __ASM_EMIT("vmovups 0x00(%[mid], %[off]), %%zmm0") // zmm0 = m diff --git a/src/test/utest/msmatrix/conv2.cpp b/src/test/utest/msmatrix/conv2.cpp index f22e21e4..540e3c46 100644 --- a/src/test/utest/msmatrix/conv2.cpp +++ b/src/test/utest/msmatrix/conv2.cpp @@ -1,6 +1,6 @@ /* - * Copyright (C) 2023 Linux Studio Plugins Project - * (C) 2023 Vladimir Sadovnikov + * Copyright (C) 2024 Linux Studio Plugins Project + * (C) 2024 Vladimir Sadovnikov * * This file is part of lsp-dsp-lib * Created on: 31 мар. 2020 г. @@ -85,7 +85,7 @@ UTEST_BEGIN("dsp.msmatrix", conv2) return; UTEST_FOREACH(count, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, - 32, 64, 65, 100, 999, 0xfff) + 32, 33, 34, 35, 36, 37, 38, 39, 40, 63, 64, 65, 100, 999, 0xfff) { for (size_t mask=0; mask <= 0x0f; ++mask) { diff --git a/src/test/utest/msmatrix/conv2x1.cpp b/src/test/utest/msmatrix/conv2x1.cpp index ba75853e..889e8a74 100644 --- a/src/test/utest/msmatrix/conv2x1.cpp +++ b/src/test/utest/msmatrix/conv2x1.cpp @@ -1,6 +1,6 @@ /* - * Copyright (C) 2023 Linux Studio Plugins Project - * (C) 2023 Vladimir Sadovnikov + * Copyright (C) 2024 Linux Studio Plugins Project + * (C) 2024 Vladimir Sadovnikov * * This file is part of lsp-dsp-lib * Created on: 31 мар. 2020 г. @@ -97,7 +97,7 @@ UTEST_BEGIN("dsp.msmatrix", conv2x1) return; UTEST_FOREACH(count, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, - 32, 64, 65, 100, 999, 0xfff) + 32, 33, 34, 35, 36, 37, 38, 39, 40, 63, 64, 65, 100, 999, 0xfff) { for (size_t mask=0; mask <= 0x07; ++mask) {