From ed697d97e349f2439897712188b719141498c1ff Mon Sep 17 00:00:00 2001 From: Derzhavin Dmitry Date: Tue, 26 Apr 2022 10:15:26 +0300 Subject: [PATCH 1/3] nmppsCmpEq0__nm16u15b wtw++ --- src/nmplv/Select/nm/VEC_CmpEq0__nm16u15b.asm | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/nmplv/Select/nm/VEC_CmpEq0__nm16u15b.asm b/src/nmplv/Select/nm/VEC_CmpEq0__nm16u15b.asm index 7cfeb057..8e7de547 100644 --- a/src/nmplv/Select/nm/VEC_CmpEq0__nm16u15b.asm +++ b/src/nmplv/Select/nm/VEC_CmpEq0__nm16u15b.asm @@ -106,6 +106,7 @@ global _nmppsCmpEq0_16u15b:label; .repeat 6; rep 32 data = [ar0++gr0], ftw with vsum, activate data, afifo; //WTW_REG_DEPRICATED(gr5); + wtw; ar0-=1022; .endrepeat; rep 32 wfifo = [ar4++], ftw; @@ -158,4 +159,4 @@ global _nmppsCmpEq0_16u15b:label; end ".text_nmplv"; //********************************************************************/ // END OF FILE BoolConvert16to1.asm */ -//********************************************************************/ \ No newline at end of file +//********************************************************************/ From 52589ce221fb4d5c8f8e348b5a3e1b864efa3a8f Mon Sep 17 00:00:00 2001 From: Derzhavin Dmitry Date: Tue, 26 Apr 2022 13:26:10 +0300 Subject: [PATCH 2/3] nmppsMul_AddC_64s opened for nmc4 --- src/nmplv/Arithmetics/nm/VEC_MulV_AddC__nm64s.asm | 2 -- 1 file changed, 2 deletions(-) diff --git a/src/nmplv/Arithmetics/nm/VEC_MulV_AddC__nm64s.asm b/src/nmplv/Arithmetics/nm/VEC_MulV_AddC__nm64s.asm index 08c1d6be..e745a446 100644 --- a/src/nmplv/Arithmetics/nm/VEC_MulV_AddC__nm64s.asm +++ b/src/nmplv/Arithmetics/nm/VEC_MulV_AddC__nm64s.asm @@ -23,7 +23,6 @@ begin ".text_nmplv" -.if .nm64revision == 5; ///////////////////////////////////////////////////////////////////////////////////////// @@ -72,6 +71,5 @@ global _nmppsMul_AddC_64s:label; return; .wait; -.endif; end ".text_nmplv"; From 8de5c2a885236a962e20085b54c523294ecaa9f6 Mon Sep 17 00:00:00 2001 From: Derzhavin Dmitry Date: Tue, 26 Apr 2022 15:15:02 +0300 Subject: [PATCH 3/3] Added nmppsSub_8s for pc --- src/nmplv/Arithmetics/pc/nmpps-Sub.c | 15 ++++++++++++--- 1 file changed, 12 insertions(+), 3 deletions(-) diff --git a/src/nmplv/Arithmetics/pc/nmpps-Sub.c b/src/nmplv/Arithmetics/pc/nmpps-Sub.c index 854cc051..7fef5ce4 100644 --- a/src/nmplv/Arithmetics/pc/nmpps-Sub.c +++ b/src/nmplv/Arithmetics/pc/nmpps-Sub.c @@ -22,9 +22,18 @@ #include "nmtype.h" ///////////////////////////////////////////////////////////////////////////////////////// // Subtraction of two char buffers -// 2826 ticks per 10240 elements with C++ call (0.276 clocks per element) -// The order of intermediate data transmissions in function is: -// Buf1[],Buf2 => pDstVec[] - Subtraction (in-place is supported) +void nmppsSub_8s( + const nm8s* pSrcVec1, // input buffer :long Local [VecSize/4] + const nm8s* pSrcVec2, // input buffer :long Local [VecSize/4] + nm8s* pDstVec, // output buffer :long Global[VecSize/4] + int nSize // size of input buffer in 8-bit elements. nSize=[0,8,16,24..] + ) +{ + int i; + for (i=0; i