X-Git-Url: https://oss.titaniummirror.com/gitweb?p=msp430-binutils.git;a=blobdiff_plain;f=gas%2Ftestsuite%2Fgas%2Fbfin%2Fvideo2.s;fp=gas%2Ftestsuite%2Fgas%2Fbfin%2Fvideo2.s;h=22fb50f3e5979aca660b07f1bf0475a73fb74f73;hp=16b0ff11730da29fc67cc3b6a29554a90158a7bd;hb=d5da4f291af551c0b8b79e1d4a9b173d60e5c10e;hpb=7b5ea4fcdf2819e070665ab5610f8b48e3867c10 diff --git a/gas/testsuite/gas/bfin/video2.s b/gas/testsuite/gas/bfin/video2.s index 16b0ff1..22fb50f 100755 --- a/gas/testsuite/gas/bfin/video2.s +++ b/gas/testsuite/gas/bfin/video2.s @@ -1,220 +1,220 @@ - -.EXTERN MY_LABEL2; -.section .text; - -// -//13 VIDEO PIXEL OPERATIONS -// - -//Dreg = ALIGN8 ( Dreg, Dreg ) ; /* overlay 1 byte (b) */ -R0 = ALIGN8(R0, R0); -R0 = ALIGN8(R0, R1); -R0 = ALIGN8(R1, R0); -R0 = ALIGN8(R1, R1); -R0 = ALIGN8(R1, R2); -R3 = ALIGN8(R4, R5); -R6 = ALIGN8(R7, R0); -R1 = ALIGN8(R2, R3); -R4 = ALIGN8(R5, R6); -R7 = ALIGN8(R0, R1); -R2 = ALIGN8(R3, R4); -R5 = ALIGN8(R6, R7); - -//Dreg = ALIGN16 ( Dreg, Dreg ) ; /* overlay 2 bytes (b) */ -R0 = ALIGN16(R0, R0); -R0 = ALIGN16(R0, R1); -R0 = ALIGN16(R1, R0); -R0 = ALIGN16(R1, R1); -R0 = ALIGN16(R1, R2); -R3 = ALIGN16(R4, R5); -R6 = ALIGN16(R7, R0); -R1 = ALIGN16(R2, R3); -R4 = ALIGN16(R5, R6); -R7 = ALIGN16(R0, R1); -R2 = ALIGN16(R3, R4); -R5 = ALIGN16(R6, R7); - -//Dreg = ALIGN24 ( Dreg, Dreg ) ; /* overlay 3 bytes (b) */ -R0 = ALIGN24(R0, R0); -R0 = ALIGN24(R0, R1); -R0 = ALIGN24(R1, R0); -R0 = ALIGN24(R1, R1); -R0 = ALIGN24(R1, R2); -R3 = ALIGN24(R4, R5); -R6 = ALIGN24(R7, R0); -R1 = ALIGN24(R2, R3); -R4 = ALIGN24(R5, R6); -R7 = ALIGN24(R0, R1); -R2 = ALIGN24(R3, R4); -R5 = ALIGN24(R6, R7); - -DISALGNEXCPT ; /* (b) */ - -/* forward byte order operands */ -//Dreg = BYTEOP3P (Dreg_pair, Dreg_pair) (LO) ; /* sum into low bytes (b) */ -//Dreg = BYTEOP3P (Dreg_pair, Dreg_pair) (HI) ; /* sum into high bytes (b) */ -/* reverse byte order operands */ -//Dreg = BYTEOP3P (Dreg_pair, Dreg_pair) (LO, R) ; /* sum into low bytes (b) */ -//Dreg = BYTEOP3P (Dreg_pair, Dreg_pair) (HI, R) ; /* sum into high bytes (b) */ - -r0 = byteop3p (r1:0, r3:2) (lo) ; -r1 = byteop3p (r1:0, r3:2) (hi) ; -r2 = byteop3p (r1:0, r3:2) (lo, r) ; -r3 = byteop3p (r1:0, r3:2) (hi, r) ; -r4 = byteop3p (r3:2, r1:0) (lo) ; -r5 = byteop3p (r3:2, r1:0) (hi) ; -r6 = byteop3p (r3:2, r1:0) (lo, r) ; -r7 = byteop3p (r3:2, r1:0) (hi, r) ; - -//Dreg = A1.L + A1.H, Dreg = A0.L + A0.H ; /* (b) */ - -R0 = A1.L + A1.H, R0= A0.L + A0.H ; -R0 = A1.L + A1.H, R1= A0.L + A0.H ; -R2 = A1.L + A1.H, R3= A0.L + A0.H ; -R4 = A1.L + A1.H, R5= A0.L + A0.H ; -R6 = A1.L + A1.H, R7= A0.L + A0.H ; - -/* forward byte order operands */ -//( Dreg, Dreg ) = BYTEOP16P ( Dreg_pair, Dreg_pair ) ; /* (b) */ -(r7,r0) = BYTEOP16P ( r3:2,r1:0 ) ; -(r1,r2) = byteop16p (r3:2,r1:0) ; -(r0,r1) = BYTEOP16P ( r3:2,r1:0 ) ; -(r2,r3) = byteop16p (r3:2,r1:0) ; -(r7,r0) = BYTEOP16P (r1:0, r3:2) ; -(r1,r2) = byteop16p (r1:0,r3:2) ; -(r0,r1) = BYTEOP16P (r1:0, r3:2) ; -(r2,r3) = byteop16p (r1:0,r3:2) ; - -/* reverse byte order operands */ -//( Dreg, Dreg ) = BYTEOP16P ( Dreg_pair, Dreg_pair ) (R); /* (b) */ -(r7,r0) = BYTEOP16P ( r3:2,r1:0 )(r) ; -(r1,r2) = byteop16p (r3:2,r1:0)(r) ; -(r0,r1) = BYTEOP16P ( r3:2,r1:0 )(r) ; -(r2,r3) = byteop16p (r3:2,r1:0)(r) ; -(r7,r0) = BYTEOP16P (r1:0, r3:2)(r) ; -(r1,r2) = byteop16p (r1:0,r3:2)(r) ; -(r0,r1) = BYTEOP16P (r1:0, r3:2)(r) ; -(r2,r3) = byteop16p (r1:0,r3:2)(r) ; - -/* forward byte order operands */ -//Dreg = BYTEOP1P (Dreg_pair, Dreg_pair) ; /* (b) */ -//Dreg = BYTEOP1P (Dreg_pair, Dreg_pair) (T) ; /* truncated (b)*/ -/* reverse byte order operands */ -//Dreg = BYTEOP1P (Dreg_pair, Dreg_pair) (R) ; /* (b) */ -//Dreg = BYTEOP1P (Dreg_pair, Dreg_pair) (T, R) ; /* truncated (b) */ - -r3 = byteop1p (r1:0, r3:2) ; -r3 = byteop1p (r1:0, r3:2) (r) ; -r3 = byteop1p (r1:0, r3:2) (t) ; -r3 = byteop1p (r1:0, r3:2) (t,r) ; - -r0 = byteop1p (r3:2,r1:0); -r1 = byteop1p (r3:2,r1:0)(r) ; -r2 = byteop1p (r3:2,r1:0)(t) ; -r3 = byteop1p (r3:2,r1:0)(t,r) ; - -/* forward byte order operands */ -//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (RNDL) ; -/* round into low bytes (b) */ -//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (RNDH) ; -/* round into high bytes (b) */ -//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (TL) ; -/* truncate into low bytes (b) */ -//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (TH) ; -/* truncate into high bytes (b) */ -/* reverse byte order operands */ -//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (RNDL, R) ; -/* round into low bytes (b) */ -//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (RNDH, R) ; -/* round into high bytes (b) */ -//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (TL, R) ; -/* truncate into low bytes (b) */ -//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (TH, R) ; -/* truncate into high bytes (b) */ - -r3 = byteop2p (r1:0, r3:2) (rndl) ; -r3 = byteop2p (r1:0, r3:2) (rndh) ; -r3 = byteop2p (r1:0, r3:2) (tl) ; -r3 = byteop2p (r1:0, r3:2) (th) ; -r3 = byteop2p (r1:0, r3:2) (rndl, r) ; -r3 = byteop2p (r1:0, r3:2) (rndh, r) ; -r3 = byteop2p (r1:0, r3:2) (tl, r) ; -r3 = byteop2p (r1:0, r3:2) (th, r) ; - -r0 = byteop2p (r1:0, r3:2) (rndl) ; -r1 = byteop2p (r1:0, r3:2) (rndh) ; -r2 = byteop2p (r1:0, r3:2) (tl) ; -r3 = byteop2p (r1:0, r3:2) (th) ; -r4 = byteop2p (r1:0, r3:2) (rndl, r) ; -r5 = byteop2p (r1:0, r3:2) (rndh, r) ; -r6 = byteop2p (r1:0, r3:2) (tl, r) ; -r7 = byteop2p (r1:0, r3:2) (th, r) ; - -r0 = byteop2p (r3:2, r3:2) (rndl) ; -r1 = byteop2p (r3:2, r3:2) (rndh) ; -r2 = byteop2p (r3:2, r3:2) (tl) ; -r3 = byteop2p (r3:2, r3:2) (th) ; -r4 = byteop2p (r3:2, r3:2) (rndl, r) ; -r5 = byteop2p (r3:2, r3:2) (rndh, r) ; -r6 = byteop2p (r3:2, r3:2) (tl, r) ; -r7 = byteop2p (r3:2, r3:2) (th, r) ; - -//Dreg = BYTEPACK ( Dreg, Dreg ) ; /* (b) */ -r0 = bytepack (r0,r0) ; -r1 = bytepack (r2,r3) ; -r4 = bytepack (r5,r6) ; -r7 = bytepack (r0,r1) ; -r2 = bytepack (r3,r4) ; -r5 = bytepack (r6,r7) ; - -/* forward byte order operands */ -//(Dreg, Dreg) = BYTEOP16M (Dreg_pair, Dreg_pair) ; /* (b */) -/* reverse byte order operands */ -//(Dreg, Dreg) = BYTEOP16M (Dreg-pair, Dreg-pair) (R) ; /* (b) */ - -(r1,r2)= byteop16m (r3:2,r1:0) ; -(r1,r2)= byteop16m (r3:2,r1:0) (r) ; -(r0,r1)= byteop16m (r3:2,r1:0) ; -(r2,r3)= byteop16m (r3:2,r1:0) (r) ; -(r3,r5)= byteop16m (r3:2,r1:0) ; -(r6,r7)= byteop16m (r3:2,r1:0) (r) ; - -(r1,r2)= byteop16m (r1:0,r1:0) ; -(r1,r2)= byteop16m (r1:0,r1:0) (r) ; -(r0,r1)= byteop16m (r1:0,r1:0) ; -(r2,r3)= byteop16m (r1:0,r1:0) (r) ; -(r3,r5)= byteop16m (r1:0,r1:0) ; -(r6,r7)= byteop16m (r1:0,r1:0) (r) ; - -(r1,r2)= byteop16m (r1:0,r3:2) ; -(r1,r2)= byteop16m (r1:0,r3:2) (r) ; -(r0,r1)= byteop16m (r1:0,r3:2) ; -(r2,r3)= byteop16m (r1:0,r3:2) (r) ; -(r3,r5)= byteop16m (r1:0,r3:2) ; -(r6,r7)= byteop16m (r1:0,r3:2) (r) ; - -(r1,r2)= byteop16m (r3:2,r3:2) ; -(r1,r2)= byteop16m (r3:2,r3:2) (r) ; -(r0,r1)= byteop16m (r3:2,r3:2) ; -(r2,r3)= byteop16m (r3:2,r3:2) (r) ; -(r3,r5)= byteop16m (r3:2,r3:2) ; -(r6,r7)= byteop16m (r3:2,r3:2) (r) ; - -//SAA (Dreg_pair, Dreg_pair) ; /* forward byte order operands (b) */ -//SAA (Dreg_pair, Dreg_pair) (R) ; /* reverse byte order operands (b) */ - -saa(r1:0, r3:2) || r0 = [i0++] || r2 = [i1++] ; /* parallel fill instructions */ -saa (r1:0, r3:2) (R) || r1 = [i0++] || r3 = [i1++] ; /* reverse, parallel fill instructions */ -saa (r1:0, r3:2) ; /* last SAA in a loop, no more fill required */ - -//( Dreg , Dreg ) = BYTEUNPACK Dreg_pair ; /* (b) */ -//( Dreg , Dreg ) = BYTEUNPACK Dreg_pair (R) ; /* reverse source order (b) */ - -(r6,r5) = byteunpack r1:0 ; /* non-reversing sources */ -(r6,r5) = byteunpack r1:0 (R) ; /* reversing sources case */ -(r6,r5) = byteunpack r3:2 ; /* non-reversing sources */ -(r6,r5) = byteunpack r3:2 (R) ; /* reversing sources case */ -(r0,r1) = byteunpack r1:0 ; /* non-reversing sources */ -(r2,r3) = byteunpack r1:0 (R) ; /* reversing sources case */ -(r4,r5) = byteunpack r3:2 ; /* non-reversing sources */ -(r6,r7) = byteunpack r3:2 (R) ; /* reversing sources case */ + +.EXTERN MY_LABEL2; +.section .text; + +// +//13 VIDEO PIXEL OPERATIONS +// + +//Dreg = ALIGN8 ( Dreg, Dreg ) ; /* overlay 1 byte (b) */ +R0 = ALIGN8(R0, R0); +R0 = ALIGN8(R0, R1); +R0 = ALIGN8(R1, R0); +R0 = ALIGN8(R1, R1); +R0 = ALIGN8(R1, R2); +R3 = ALIGN8(R4, R5); +R6 = ALIGN8(R7, R0); +R1 = ALIGN8(R2, R3); +R4 = ALIGN8(R5, R6); +R7 = ALIGN8(R0, R1); +R2 = ALIGN8(R3, R4); +R5 = ALIGN8(R6, R7); + +//Dreg = ALIGN16 ( Dreg, Dreg ) ; /* overlay 2 bytes (b) */ +R0 = ALIGN16(R0, R0); +R0 = ALIGN16(R0, R1); +R0 = ALIGN16(R1, R0); +R0 = ALIGN16(R1, R1); +R0 = ALIGN16(R1, R2); +R3 = ALIGN16(R4, R5); +R6 = ALIGN16(R7, R0); +R1 = ALIGN16(R2, R3); +R4 = ALIGN16(R5, R6); +R7 = ALIGN16(R0, R1); +R2 = ALIGN16(R3, R4); +R5 = ALIGN16(R6, R7); + +//Dreg = ALIGN24 ( Dreg, Dreg ) ; /* overlay 3 bytes (b) */ +R0 = ALIGN24(R0, R0); +R0 = ALIGN24(R0, R1); +R0 = ALIGN24(R1, R0); +R0 = ALIGN24(R1, R1); +R0 = ALIGN24(R1, R2); +R3 = ALIGN24(R4, R5); +R6 = ALIGN24(R7, R0); +R1 = ALIGN24(R2, R3); +R4 = ALIGN24(R5, R6); +R7 = ALIGN24(R0, R1); +R2 = ALIGN24(R3, R4); +R5 = ALIGN24(R6, R7); + +DISALGNEXCPT ; /* (b) */ + +/* forward byte order operands */ +//Dreg = BYTEOP3P (Dreg_pair, Dreg_pair) (LO) ; /* sum into low bytes (b) */ +//Dreg = BYTEOP3P (Dreg_pair, Dreg_pair) (HI) ; /* sum into high bytes (b) */ +/* reverse byte order operands */ +//Dreg = BYTEOP3P (Dreg_pair, Dreg_pair) (LO, R) ; /* sum into low bytes (b) */ +//Dreg = BYTEOP3P (Dreg_pair, Dreg_pair) (HI, R) ; /* sum into high bytes (b) */ + +r0 = byteop3p (r1:0, r3:2) (lo) ; +r1 = byteop3p (r1:0, r3:2) (hi) ; +r2 = byteop3p (r1:0, r3:2) (lo, r) ; +r3 = byteop3p (r1:0, r3:2) (hi, r) ; +r4 = byteop3p (r3:2, r1:0) (lo) ; +r5 = byteop3p (r3:2, r1:0) (hi) ; +r6 = byteop3p (r3:2, r1:0) (lo, r) ; +r7 = byteop3p (r3:2, r1:0) (hi, r) ; + +//Dreg = A1.L + A1.H, Dreg = A0.L + A0.H ; /* (b) */ + +R0 = A1.L + A1.H, R0= A0.L + A0.H ; +R0 = A1.L + A1.H, R1= A0.L + A0.H ; +R2 = A1.L + A1.H, R3= A0.L + A0.H ; +R4 = A1.L + A1.H, R5= A0.L + A0.H ; +R6 = A1.L + A1.H, R7= A0.L + A0.H ; + +/* forward byte order operands */ +//( Dreg, Dreg ) = BYTEOP16P ( Dreg_pair, Dreg_pair ) ; /* (b) */ +(r7,r0) = BYTEOP16P ( r3:2,r1:0 ) ; +(r1,r2) = byteop16p (r3:2,r1:0) ; +(r0,r1) = BYTEOP16P ( r3:2,r1:0 ) ; +(r2,r3) = byteop16p (r3:2,r1:0) ; +(r7,r0) = BYTEOP16P (r1:0, r3:2) ; +(r1,r2) = byteop16p (r1:0,r3:2) ; +(r0,r1) = BYTEOP16P (r1:0, r3:2) ; +(r2,r3) = byteop16p (r1:0,r3:2) ; + +/* reverse byte order operands */ +//( Dreg, Dreg ) = BYTEOP16P ( Dreg_pair, Dreg_pair ) (R); /* (b) */ +(r7,r0) = BYTEOP16P ( r3:2,r1:0 )(r) ; +(r1,r2) = byteop16p (r3:2,r1:0)(r) ; +(r0,r1) = BYTEOP16P ( r3:2,r1:0 )(r) ; +(r2,r3) = byteop16p (r3:2,r1:0)(r) ; +(r7,r0) = BYTEOP16P (r1:0, r3:2)(r) ; +(r1,r2) = byteop16p (r1:0,r3:2)(r) ; +(r0,r1) = BYTEOP16P (r1:0, r3:2)(r) ; +(r2,r3) = byteop16p (r1:0,r3:2)(r) ; + +/* forward byte order operands */ +//Dreg = BYTEOP1P (Dreg_pair, Dreg_pair) ; /* (b) */ +//Dreg = BYTEOP1P (Dreg_pair, Dreg_pair) (T) ; /* truncated (b)*/ +/* reverse byte order operands */ +//Dreg = BYTEOP1P (Dreg_pair, Dreg_pair) (R) ; /* (b) */ +//Dreg = BYTEOP1P (Dreg_pair, Dreg_pair) (T, R) ; /* truncated (b) */ + +r3 = byteop1p (r1:0, r3:2) ; +r3 = byteop1p (r1:0, r3:2) (r) ; +r3 = byteop1p (r1:0, r3:2) (t) ; +r3 = byteop1p (r1:0, r3:2) (t,r) ; + +r0 = byteop1p (r3:2,r1:0); +r1 = byteop1p (r3:2,r1:0)(r) ; +r2 = byteop1p (r3:2,r1:0)(t) ; +r3 = byteop1p (r3:2,r1:0)(t,r) ; + +/* forward byte order operands */ +//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (RNDL) ; +/* round into low bytes (b) */ +//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (RNDH) ; +/* round into high bytes (b) */ +//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (TL) ; +/* truncate into low bytes (b) */ +//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (TH) ; +/* truncate into high bytes (b) */ +/* reverse byte order operands */ +//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (RNDL, R) ; +/* round into low bytes (b) */ +//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (RNDH, R) ; +/* round into high bytes (b) */ +//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (TL, R) ; +/* truncate into low bytes (b) */ +//Dreg = BYTEOP2P (Dreg_pair, Dreg_pair) (TH, R) ; +/* truncate into high bytes (b) */ + +r3 = byteop2p (r1:0, r3:2) (rndl) ; +r3 = byteop2p (r1:0, r3:2) (rndh) ; +r3 = byteop2p (r1:0, r3:2) (tl) ; +r3 = byteop2p (r1:0, r3:2) (th) ; +r3 = byteop2p (r1:0, r3:2) (rndl, r) ; +r3 = byteop2p (r1:0, r3:2) (rndh, r) ; +r3 = byteop2p (r1:0, r3:2) (tl, r) ; +r3 = byteop2p (r1:0, r3:2) (th, r) ; + +r0 = byteop2p (r1:0, r3:2) (rndl) ; +r1 = byteop2p (r1:0, r3:2) (rndh) ; +r2 = byteop2p (r1:0, r3:2) (tl) ; +r3 = byteop2p (r1:0, r3:2) (th) ; +r4 = byteop2p (r1:0, r3:2) (rndl, r) ; +r5 = byteop2p (r1:0, r3:2) (rndh, r) ; +r6 = byteop2p (r1:0, r3:2) (tl, r) ; +r7 = byteop2p (r1:0, r3:2) (th, r) ; + +r0 = byteop2p (r3:2, r3:2) (rndl) ; +r1 = byteop2p (r3:2, r3:2) (rndh) ; +r2 = byteop2p (r3:2, r3:2) (tl) ; +r3 = byteop2p (r3:2, r3:2) (th) ; +r4 = byteop2p (r3:2, r3:2) (rndl, r) ; +r5 = byteop2p (r3:2, r3:2) (rndh, r) ; +r6 = byteop2p (r3:2, r3:2) (tl, r) ; +r7 = byteop2p (r3:2, r3:2) (th, r) ; + +//Dreg = BYTEPACK ( Dreg, Dreg ) ; /* (b) */ +r0 = bytepack (r0,r0) ; +r1 = bytepack (r2,r3) ; +r4 = bytepack (r5,r6) ; +r7 = bytepack (r0,r1) ; +r2 = bytepack (r3,r4) ; +r5 = bytepack (r6,r7) ; + +/* forward byte order operands */ +//(Dreg, Dreg) = BYTEOP16M (Dreg_pair, Dreg_pair) ; /* (b */) +/* reverse byte order operands */ +//(Dreg, Dreg) = BYTEOP16M (Dreg-pair, Dreg-pair) (R) ; /* (b) */ + +(r1,r2)= byteop16m (r3:2,r1:0) ; +(r1,r2)= byteop16m (r3:2,r1:0) (r) ; +(r0,r1)= byteop16m (r3:2,r1:0) ; +(r2,r3)= byteop16m (r3:2,r1:0) (r) ; +(r3,r5)= byteop16m (r3:2,r1:0) ; +(r6,r7)= byteop16m (r3:2,r1:0) (r) ; + +(r1,r2)= byteop16m (r1:0,r1:0) ; +(r1,r2)= byteop16m (r1:0,r1:0) (r) ; +(r0,r1)= byteop16m (r1:0,r1:0) ; +(r2,r3)= byteop16m (r1:0,r1:0) (r) ; +(r3,r5)= byteop16m (r1:0,r1:0) ; +(r6,r7)= byteop16m (r1:0,r1:0) (r) ; + +(r1,r2)= byteop16m (r1:0,r3:2) ; +(r1,r2)= byteop16m (r1:0,r3:2) (r) ; +(r0,r1)= byteop16m (r1:0,r3:2) ; +(r2,r3)= byteop16m (r1:0,r3:2) (r) ; +(r3,r5)= byteop16m (r1:0,r3:2) ; +(r6,r7)= byteop16m (r1:0,r3:2) (r) ; + +(r1,r2)= byteop16m (r3:2,r3:2) ; +(r1,r2)= byteop16m (r3:2,r3:2) (r) ; +(r0,r1)= byteop16m (r3:2,r3:2) ; +(r2,r3)= byteop16m (r3:2,r3:2) (r) ; +(r3,r5)= byteop16m (r3:2,r3:2) ; +(r6,r7)= byteop16m (r3:2,r3:2) (r) ; + +//SAA (Dreg_pair, Dreg_pair) ; /* forward byte order operands (b) */ +//SAA (Dreg_pair, Dreg_pair) (R) ; /* reverse byte order operands (b) */ + +saa(r1:0, r3:2) || r0 = [i0++] || r2 = [i1++] ; /* parallel fill instructions */ +saa (r1:0, r3:2) (R) || r1 = [i0++] || r3 = [i1++] ; /* reverse, parallel fill instructions */ +saa (r1:0, r3:2) ; /* last SAA in a loop, no more fill required */ + +//( Dreg , Dreg ) = BYTEUNPACK Dreg_pair ; /* (b) */ +//( Dreg , Dreg ) = BYTEUNPACK Dreg_pair (R) ; /* reverse source order (b) */ + +(r6,r5) = byteunpack r1:0 ; /* non-reversing sources */ +(r6,r5) = byteunpack r1:0 (R) ; /* reversing sources case */ +(r6,r5) = byteunpack r3:2 ; /* non-reversing sources */ +(r6,r5) = byteunpack r3:2 (R) ; /* reversing sources case */ +(r0,r1) = byteunpack r1:0 ; /* non-reversing sources */ +(r2,r3) = byteunpack r1:0 (R) ; /* reversing sources case */ +(r4,r5) = byteunpack r3:2 ; /* non-reversing sources */ +(r6,r7) = byteunpack r3:2 (R) ; /* reversing sources case */