Displaying 12 results from an estimated 12 matches for "in8".
Did you mean:
in
2017 Feb 07
2
[PATCH] Optimize silk_warped_autocorrelation_FIX() for ARM NEON
...in4(s0))
> PROC( in0(s5) in1(s4) in2(s3) in3(s2) in4(s1) in5(s0))
> PROC( in0(s6) in1(s5) in2(s4) in3(s3) in4(s2) in5(s1) in6(s0))
> PROC(in0(s7) in1(s6) in2(s5) in3(s4) in4(s3) in5(s2) in6(s1) in7(s0))
> PROC(in1(s7) in2(s6) in3(s5) in4(s4) in5(s3) in6(s2) in7(s1) in8(s0))
> PROC(in2(s7) in3(s6) in4(s5) in5(s4) in6(s3) in7(s2) in8(s1) in9(s0))
> PROC(in3(s7) in4(s6) in5(s5) in6(s4) in7(s3) in8(s2) in9(s1)in10(s0))
> PROC(in4(s7) in5(s6) in6(s5) in7(s4) in8(s3) in9(s2)in10(s1)in11(s0))
> ...and so on until the end of the input vector
>
> The dif...
2017 Feb 07
3
[PATCH] Optimize silk_warped_autocorrelation_FIX() for ARM NEON
...in0(s5) in1(s4) in2(s3) in3(s2) in4(s1) in5(s0))
> > PROC( in0(s6) in1(s5) in2(s4) in3(s3) in4(s2) in5(s1) in6(s0))
> > PROC(in0(s7) in1(s6) in2(s5) in3(s4) in4(s3) in5(s2) in6(s1) in7(s0))
> > PROC(in1(s7) in2(s6) in3(s5) in4(s4) in5(s3) in6(s2) in7(s1) in8(s0))
> > PROC(in2(s7) in3(s6) in4(s5) in5(s4) in6(s3) in7(s2) in8(s1) in9(s0))
> > PROC(in3(s7) in4(s6) in5(s5) in6(s4) in7(s3) in8(s2) in9(s1)in10(s0))
> > PROC(in4(s7) in5(s6) in6(s5) in7(s4) in8(s3) in9(s2)in10(s1)in11(s0))
> > ...and so on until the end o...
2017 Feb 06
0
[PATCH] Optimize silk_warped_autocorrelation_FIX() for ARM NEON
...s3) in2(s2) in3(s1) in4(s0))
PROC( in0(s5) in1(s4) in2(s3) in3(s2) in4(s1) in5(s0))
PROC( in0(s6) in1(s5) in2(s4) in3(s3) in4(s2) in5(s1) in6(s0))
PROC(in0(s7) in1(s6) in2(s5) in3(s4) in4(s3) in5(s2) in6(s1) in7(s0))
PROC(in1(s7) in2(s6) in3(s5) in4(s4) in5(s3) in6(s2) in7(s1) in8(s0))
PROC(in2(s7) in3(s6) in4(s5) in5(s4) in6(s3) in7(s2) in8(s1) in9(s0))
PROC(in3(s7) in4(s6) in5(s5) in6(s4) in7(s3) in8(s2) in9(s1)in10(s0))
PROC(in4(s7) in5(s6) in6(s5) in7(s4) in8(s3) in9(s2)in10(s1)in11(s0))
...and so on until the end of the input vector
The difference is that it's now...
2017 Feb 06
2
[PATCH] Optimize silk_warped_autocorrelation_FIX() for ARM NEON
Hi Jean-Marc,
Thanks a lot for reviewing this huge assembly function!
silk_warped_autocorrelation_FIX_c()'s kernel part is
for( n = 0; n < length; n++ ) {
tmp1_QS = silk_LSHIFT32( (opus_int32)input[ n ], QS );
/* Loop over allpass sections */
for( i = 0; i < order; i++ ) {
/* Output of allpass section */
tmp2_QS = silk_SMLAWB(
2017 Apr 05
2
[PATCH] Optimize silk_warped_autocorrelation_FIX() for ARM NEON
...>> > PROC( in0(s6) in1(s5) in2(s4) in3(s3) in4(s2) in5(s1)
>>> in6(s0))
>>> > PROC(in0(s7) in1(s6) in2(s5) in3(s4) in4(s3) in5(s2) in6(s1)
>>> in7(s0))
>>> > PROC(in1(s7) in2(s6) in3(s5) in4(s4) in5(s3) in6(s2) in7(s1)
>>> in8(s0))
>>> > PROC(in2(s7) in3(s6) in4(s5) in5(s4) in6(s3) in7(s2) in8(s1)
>>> in9(s0))
>>> > PROC(in3(s7) in4(s6) in5(s5) in6(s4) in7(s3) in8(s2)
>>> in9(s1)in10(s0))
>>> > PROC(in4(s7) in5(s6) in6(s5) in7(s4) in8(s3)
>>> in9(...
2017 Feb 07
0
[PATCH] Optimize silk_warped_autocorrelation_FIX() for ARM NEON
...PROC( in0(s5) in1(s4) in2(s3) in3(s2) in4(s1) in5(s0))
> PROC( in0(s6) in1(s5) in2(s4) in3(s3) in4(s2) in5(s1) in6(s0))
> PROC(in0(s7) in1(s6) in2(s5) in3(s4) in4(s3) in5(s2) in6(s1) in7(s0))
> PROC(in1(s7) in2(s6) in3(s5) in4(s4) in5(s3) in6(s2) in7(s1) in8(s0))
> PROC(in2(s7) in3(s6) in4(s5) in5(s4) in6(s3) in7(s2) in8(s1) in9(s0))
> PROC(in3(s7) in4(s6) in5(s5) in6(s4) in7(s3) in8(s2) in9(s1)in10(s0))
> PROC(in4(s7) in5(s6) in6(s5) in7(s4) in8(s3) in9(s2)in10(s1)in11(s0))
> ...and so on until the end of the input vector
>...
2017 Apr 03
0
[PATCH] Optimize silk_warped_autocorrelation_FIX() for ARM NEON
...>> in5(s0))
>> > PROC( in0(s6) in1(s5) in2(s4) in3(s3) in4(s2) in5(s1)
>> in6(s0))
>> > PROC(in0(s7) in1(s6) in2(s5) in3(s4) in4(s3) in5(s2) in6(s1)
>> in7(s0))
>> > PROC(in1(s7) in2(s6) in3(s5) in4(s4) in5(s3) in6(s2) in7(s1)
>> in8(s0))
>> > PROC(in2(s7) in3(s6) in4(s5) in5(s4) in6(s3) in7(s2) in8(s1)
>> in9(s0))
>> > PROC(in3(s7) in4(s6) in5(s5) in6(s4) in7(s3) in8(s2)
>> in9(s1)in10(s0))
>> > PROC(in4(s7) in5(s6) in6(s5) in7(s4) in8(s3)
>> in9(s2)in10(s1)in11(s0))
>...
2017 Apr 05
4
[PATCH] Optimize silk_warped_autocorrelation_FIX() for ARM NEON
...in2(s4) in3(s3) in4(s2)
> > in5(s1) in6(s0))
> > > PROC(in0(s7) in1(s6) in2(s5) in3(s4) in4(s3) in5(s2)
> > in6(s1) in7(s0))
> > > PROC(in1(s7) in2(s6) in3(s5) in4(s4) in5(s3) in6(s2)
> > in7(s1) in8(s0))
> > > PROC(in2(s7) in3(s6) in4(s5) in5(s4) in6(s3) in7(s2)
> > in8(s1) in9(s0))
> > > PROC(in3(s7) in4(s6) in5(s5) in6(s4) in7(s3) in8(s2)
> > in9(s1)in10(s0))
> > > PROC(in4(s7) in5(...
2017 Apr 05
0
[PATCH] Optimize silk_warped_autocorrelation_FIX() for ARM NEON
...( in0(s6) in1(s5) in2(s4) in3(s3) in4(s2)
> in5(s1) in6(s0))
> > PROC(in0(s7) in1(s6) in2(s5) in3(s4) in4(s3) in5(s2)
> in6(s1) in7(s0))
> > PROC(in1(s7) in2(s6) in3(s5) in4(s4) in5(s3) in6(s2)
> in7(s1) in8(s0))
> > PROC(in2(s7) in3(s6) in4(s5) in5(s4) in6(s3) in7(s2)
> in8(s1) in9(s0))
> > PROC(in3(s7) in4(s6) in5(s5) in6(s4) in7(s3) in8(s2)
> in9(s1)in10(s0))
> > PROC(in4(s7) in5(s6) in6(s5) in7(s4) in8(s...
2008 Sep 08
2
[LLVMdev] Overzealous PromoteCastOfAllocation
...uses=1]
%A12 = shl i32 %A1, 16 ; <i32> [#uses=1]
%V.in.mask = and i32 undef, 65535 ; <i32> [#uses=1]
%A12.ins = or i32 %V.in.mask, %A12 ; <i32> [#uses=1]
%B9 = zext i16 %B to i32 ; <i32> [#uses=1]
%V.in8.mask = and i32 %A12.ins, -65536 ; <i32> [#uses=1]
%B9.ins = or i32 %V.in8.mask, %B9 ; <i32> [#uses=2]
%R14 = lshr i32 %B9.ins, 16 ; <i32> [#uses=1]
%R15 = trunc i32 %R14 to i16 ; <i16> [#uses=1]
%R27 = trunc i...
2017 Apr 06
0
[PATCH] Optimize silk_warped_autocorrelation_FIX() for ARM NEON
...s2)
> > in5(s1) in6(s0))
> > > PROC(in0(s7) in1(s6) in2(s5) in3(s4) in4(s3) in5(s2)
> > in6(s1) in7(s0))
> > > PROC(in1(s7) in2(s6) in3(s5) in4(s4) in5(s3) in6(s2)
> > in7(s1) in8(s0))
> > > PROC(in2(s7) in3(s6) in4(s5) in5(s4) in6(s3) in7(s2)
> > in8(s1) in9(s0))
> > > PROC(in3(s7) in4(s6) in5(s5) in6(s4) in7(s3) in8(s2)
> > in9(s1)in10(s0))
> > >...
2008 Sep 08
0
[LLVMdev] Overzealous PromoteCastOfAllocation
...shl i32 %A1, 16 ; <i32> [#uses=1]
> %V.in.mask = and i32 undef, 65535 ; <i32> [#uses=1]
> %A12.ins = or i32 %V.in.mask, %A12 ; <i32> [#uses=1]
> %B9 = zext i16 %B to i32 ; <i32> [#uses=1]
> %V.in8.mask = and i32 %A12.ins, -65536 ; <i32> [#uses=1]
> %B9.ins = or i32 %V.in8.mask, %B9 ; <i32> [#uses=2]
> %R14 = lshr i32 %B9.ins, 16 ; <i32> [#uses=1]
> %R15 = trunc i32 %R14 to i16 ; <i16> [#uses=1]
>...