2
* Automatically Tuned Linear Algebra Software v3.8.3
3
* (C) Copyright 2007 R. Clint Whaley
5
* Redistribution and use in source and binary forms, with or without
6
* modification, are permitted provided that the following conditions
8
* 1. Redistributions of source code must retain the above copyright
9
* notice, this list of conditions and the following disclaimer.
10
* 2. Redistributions in binary form must reproduce the above copyright
11
* notice, this list of conditions, and the following disclaimer in the
12
* documentation and/or other materials provided with the distribution.
13
* 3. The name of the ATLAS group or the names of its contributers may
14
* not be used to endorse or promote products derived from this
15
* software without specific written permission.
17
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
18
* ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
19
* TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
20
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE ATLAS GROUP OR ITS CONTRIBUTORS
21
* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27
* POSSIBILITY OF SUCH DAMAGE.
32
#error "This kernel requires KB be a compile-time constant!"
35
#error "This kernel supports max KB of 80"
100
/*
 * PFDISTA expands to KB*8*8, the same quantity the prefA() call sites in
 * this kernel add to their displacement -- presumably the prefetch distance
 * for A in bytes (TODO confirm).
 * NOTE(review): the expansion is not parenthesized, so it is only safe in
 * additive contexts such as 32+PFDISTA.
 */
#define PFDISTA KB*8*8
102
/*
 * prefA(mem): emit a MIPS `pref` with hint 6 for address operand mem.
 * Used in the unrolled loop on the A column pointers (pA0..pA3).
 * NOTE(review): hint 6 is "load_retained" in the MIPS64 PREF hint table --
 * confirm against the target core's manual.
 */
#define prefA(mem) pref 6, mem
107
/*
 * prefB(mem): emit a MIPS `pref` with hint 6 for address operand mem.
 * Used in the unrolled loop on the B column pointers (pB0..pB3).
 * NOTE(review): hint 6 is "load_retained" in the MIPS64 PREF hint table --
 * confirm against the target core's manual.
 */
#define prefB(mem) pref 6, mem
112
/*
 * prefC(mem): emit a MIPS `pref` with hint 5 for address operand mem.
 * Used in the unrolled loop on the C column pointers (pC0..pC3).
 * NOTE(review): hint 5 is "store_streamed" in the MIPS64 PREF hint table --
 * confirm against the target core's manual.
 */
#define prefC(mem) pref 5, mem
117
/*
 * CMUL(i_): doubles its argument.  It wraps the byte displacements used when
 * addressing C, e.g. CMUL(8)(pC0) assembles as displacement 16 off pC0.
 * NOTE(review): presumably this accounts for C being stored with a stride of
 * two doubles per element (complex storage) -- confirm.
 */
#define CMUL(i_) ((i_)+(i_))
123
* save : 18,19,20,21,22,23
124
* $26, $27 reserved. $0 = 0, $1 used by assembler
125
* I think I can use $31 if I save and restore it. r0 = 0
126
* Avail: $2, $3, $12-25, $28, $30, $31
131
(const int M, const int N, const int K, const double alpha, const double *A,
133
const int lda, const double *B, const int ldb, const double beta,
135
double *C, const int ldc)
148
* Adjust stack and save registers
150
daddiu $sp, $sp, -FSIZE
178
ldc1 rA0, FSIZE($sp) /* get BETA from caller's stack */
179
sdc1 rA0, 152($sp) /* save BETA to my stack */
183
* (ldc,lda, ldb, K0) * sizeof; setup column ptrs
187
ld incCn, FSIZE+16($sp)
190
lw incCn, FSIZE+16($sp)
193
sll incCn, incCn, 4 /* incCn = ldc*sizeof */
195
sll incCn, incCn, 3 /* incCn = ldc*sizeof */
197
sll incAm, incAm, 3 /* incAm = lda*sizeof */
199
dmul incAn, incAm, M /* incAn = lda*M */
200
sll incBn, incBn, 3 /* incBn = ldb*sizeof */
201
dmul stBn, incBn, N /* stBn = ldb*N */
204
daddu pA1, pA0, incAm
205
daddu pA2, pA1, incAm
206
daddu pA3, pA2, incAm
207
daddu pB1, pB0, incBn
208
daddu pB2, pB1, incBn
209
daddu pB3, pB2, incBn
210
daddu pC1, pC0, incCn
211
daddu pC2, pC1, incCn
212
daddu pC3, pC2, incCn
213
sll incAm, incAm, 2 /* incAm = lda*4 */
214
sll incBn, incBn, 2 /* incBn = ldb*4 */
215
daddu stAm, pA0, incAn /* stAm = pA0 + lda*M */
216
daddu stBn, pB0, stBn /* stBn = pB0 + ldb*N */
218
sll pfA, M, 4 /* pfA = M*sizeof */
220
sll pfA, M, 3 /* pfA = M*sizeof */
222
sll incCn, incCn, 2 /* incCn = ldc*4 */
223
dsubu incCn, incCn, pfA /* incCn = ldc*4 - M */
242
ldc1 rC10, CMUL(8)(pC0)
243
ldc1 rC20, CMUL(16)(pC0)
244
ldc1 rC30, CMUL(24)(pC0)
245
ldc1 rC11, CMUL(8)(pC1)
246
ldc1 rC21, CMUL(16)(pC1)
247
ldc1 rC31, CMUL(24)(pC1)
250
ldc1 rC12, CMUL(8)(pC2)
251
ldc1 rC22, CMUL(16)(pC2)
252
ldc1 rC32, CMUL(24)(pC2)
254
ldc1 rC13, CMUL(8)(pC3)
255
ldc1 rC23, CMUL(16)(pC3)
256
ldc1 rC33, CMUL(24)(pC3)
259
ldc1 rB3, BETOFF($sp) /* load BETA */
261
ldc1 rC10, CMUL(8)(pC0)
262
ldc1 rC20, CMUL(16)(pC0)
263
ldc1 rC30, CMUL(24)(pC0)
265
mul.d rC00, rC00, rB3
266
ldc1 rC11, CMUL(8)(pC1)
267
mul.d rC10, rC10, rB3
268
ldc1 rC21, CMUL(16)(pC1)
269
mul.d rC20, rC20, rB3
270
ldc1 rC31, CMUL(24)(pC1)
271
mul.d rC30, rC30, rB3
273
mul.d rC01, rC01, rB3
274
ldc1 rC12, CMUL(8)(pC2)
275
mul.d rC11, rC11, rB3
276
ldc1 rC22, CMUL(16)(pC2)
277
mul.d rC21, rC21, rB3
278
ldc1 rC32, CMUL(24)(pC2)
279
mul.d rC31, rC31, rB3
281
mul.d rC02, rC02, rB3
282
ldc1 rC13, CMUL(8)(pC3)
283
mul.d rC12, rC12, rB3
284
ldc1 rC23, CMUL(16)(pC3)
285
mul.d rC22, rC22, rB3
286
ldc1 rC33, CMUL(24)(pC3)
287
mul.d rC32, rC32, rB3
288
mul.d rC03, rC03, rB3
289
mul.d rC13, rC13, rB3
290
mul.d rC23, rC23, rB3
291
mul.d rC33, rC33, rB3
294
#if KB <= 2 && defined(BETA0)
350
madd.d rC00, rC00, rA0, rB0
352
madd.d rC10, rC10, rA1, rB0
353
madd.d rC20, rC20, rA2, rB0
355
ldc1 rC13, CMUL(8)(pC3)
357
madd.d rC30, rC30, rA3, rB0
359
ldc1 rC23, CMUL(16)(pC3)
361
madd.d rC01, rC01, rA0, rB1
363
ldc1 rC33, CMUL(24)(pC3)
365
madd.d rC11, rC11, rA1, rB1
367
madd.d rC21, rC21, rA2, rB1
369
madd.d rC31, rC31, rA3, rB1
371
madd.d rC02, rC02, rA0, rB2
373
madd.d rC12, rC12, rA1, rB2
375
madd.d rC22, rC22, rA2, rB2
377
madd.d rC32, rC32, rA3, rB2
379
madd.d rC03, rC03, rA0, rB3
381
madd.d rC13, rC13, rA1, rB3
383
madd.d rC23, rC23, rA2, rB3
385
madd.d rC33, rC33, rA3, rB3
386
#endif /* if BETA != 0 */
388
madd.d rC00, rC00, ra0, rb0
390
madd.d rC10, rC10, ra1, rb0
392
madd.d rC20, rC20, ra2, rb0
394
madd.d rC30, rC30, ra3, rb0
396
madd.d rC01, rC01, ra0, rb1
398
madd.d rC11, rC11, ra1, rb1
400
madd.d rC21, rC21, ra2, rb1
402
madd.d rC31, rC31, ra3, rb1
403
prefA(32+KB*8*8(pA0))
404
madd.d rC02, rC02, ra0, rb2
405
prefA(32+KB*8*8(pA1))
406
madd.d rC12, rC12, ra1, rb2
407
prefA(32+KB*8*8(pA2))
408
madd.d rC22, rC22, ra2, rb2
409
prefA(32+KB*8*8(pA3))
410
madd.d rC32, rC32, ra3, rb2
411
prefA(64+KB*8*8(pA0))
412
madd.d rC03, rC03, ra0, rb3
413
prefA(64+KB*8*8(pA1))
414
madd.d rC13, rC13, ra1, rb3
415
prefA(64+KB*8*8(pA2))
416
madd.d rC23, rC23, ra2, rb3
417
prefA(64+KB*8*8(pA3))
418
madd.d rC33, rC33, ra3, rb3
422
madd.d rC00, rC00, rA0, rB0
424
madd.d rC10, rC10, rA1, rB0
426
madd.d rC20, rC20, rA2, rB0
428
madd.d rC30, rC30, rA3, rB0
430
madd.d rC01, rC01, rA0, rB1
432
madd.d rC11, rC11, rA1, rB1
434
madd.d rC21, rC21, rA2, rB1
436
madd.d rC31, rC31, rA3, rB1
437
prefA(96+KB*8*8(pA0))
438
madd.d rC02, rC02, rA0, rB2
439
prefA(96+KB*8*8(pA1))
440
madd.d rC12, rC12, rA1, rB2
441
prefA(96+KB*8*8(pA2))
442
madd.d rC22, rC22, rA2, rB2
443
prefA(96+KB*8*8(pA3))
444
madd.d rC32, rC32, rA3, rB2
445
prefA(128+KB*8*8(pA0))
446
madd.d rC03, rC03, rA0, rB3
447
prefA(128+KB*8*8(pA1))
448
madd.d rC13, rC13, rA1, rB3
449
prefA(128+KB*8*8(pA2))
450
madd.d rC23, rC23, rA2, rB3
451
prefA(128+KB*8*8(pA3))
452
madd.d rC33, rC33, rA3, rB3
454
madd.d rC00, rC00, ra0, rb0
456
madd.d rC10, rC10, ra1, rb0
458
madd.d rC20, rC20, ra2, rb0
460
madd.d rC30, rC30, ra3, rb0
462
madd.d rC01, rC01, ra0, rb1
464
madd.d rC11, rC11, ra1, rb1
466
madd.d rC21, rC21, ra2, rb1
468
madd.d rC31, rC31, ra3, rb1
469
madd.d rC02, rC02, ra0, rb2
470
madd.d rC12, rC12, ra1, rb2
471
madd.d rC22, rC22, ra2, rb2
472
madd.d rC32, rC32, ra3, rb2
473
madd.d rC03, rC03, ra0, rb3
474
madd.d rC13, rC13, ra1, rb3
475
madd.d rC23, rC23, ra2, rb3
476
madd.d rC33, rC33, ra3, rb3
480
madd.d rC00, rC00, rA0, rB0
482
madd.d rC10, rC10, rA1, rB0
484
madd.d rC20, rC20, rA2, rB0
486
madd.d rC30, rC30, rA3, rB0
488
madd.d rC01, rC01, rA0, rB1
490
madd.d rC11, rC11, rA1, rB1
492
madd.d rC21, rC21, rA2, rB1
494
madd.d rC31, rC31, rA3, rB1
495
madd.d rC02, rC02, rA0, rB2
496
madd.d rC12, rC12, rA1, rB2
497
madd.d rC22, rC22, rA2, rB2
498
madd.d rC32, rC32, rA3, rB2
499
madd.d rC03, rC03, rA0, rB3
500
madd.d rC13, rC13, rA1, rB3
501
madd.d rC23, rC23, rA2, rB3
502
madd.d rC33, rC33, rA3, rB3
504
madd.d rC00, rC00, ra0, rb0
506
madd.d rC10, rC10, ra1, rb0
508
madd.d rC20, rC20, ra2, rb0
510
madd.d rC30, rC30, ra3, rb0
512
madd.d rC01, rC01, ra0, rb1
514
madd.d rC11, rC11, ra1, rb1
516
madd.d rC21, rC21, ra2, rb1
518
madd.d rC31, rC31, ra3, rb1
519
madd.d rC02, rC02, ra0, rb2
520
prefA(192+KB*8*8(pA0))
521
madd.d rC12, rC12, ra1, rb2
522
prefA(192+KB*8*8(pA1))
523
madd.d rC22, rC22, ra2, rb2
524
prefA(192+KB*8*8(pA2))
525
madd.d rC32, rC32, ra3, rb2
526
prefA(192+KB*8*8(pA3))
527
madd.d rC03, rC03, ra0, rb3
528
madd.d rC13, rC13, ra1, rb3
529
madd.d rC23, rC23, ra2, rb3
530
madd.d rC33, rC33, ra3, rb3
534
madd.d rC00, rC00, rA0, rB0
536
madd.d rC10, rC10, rA1, rB0
538
madd.d rC20, rC20, rA2, rB0
540
madd.d rC30, rC30, rA3, rB0
542
madd.d rC01, rC01, rA0, rB1
544
madd.d rC11, rC11, rA1, rB1
546
madd.d rC21, rC21, rA2, rB1
548
madd.d rC31, rC31, rA3, rB1
549
madd.d rC02, rC02, rA0, rB2
550
madd.d rC12, rC12, rA1, rB2
551
madd.d rC22, rC22, rA2, rB2
552
madd.d rC32, rC32, rA3, rB2
553
madd.d rC03, rC03, rA0, rB3
554
madd.d rC13, rC13, rA1, rB3
555
madd.d rC23, rC23, rA2, rB3
556
madd.d rC33, rC33, rA3, rB3
558
madd.d rC00, rC00, ra0, rb0
560
madd.d rC10, rC10, ra1, rb0
562
madd.d rC20, rC20, ra2, rb0
564
madd.d rC30, rC30, ra3, rb0
566
madd.d rC01, rC01, ra0, rb1
568
madd.d rC11, rC11, ra1, rb1
570
madd.d rC21, rC21, ra2, rb1
572
madd.d rC31, rC31, ra3, rb1
573
madd.d rC02, rC02, ra0, rb2
574
madd.d rC12, rC12, ra1, rb2
575
madd.d rC22, rC22, ra2, rb2
576
prefA(256+KB*8*8(pA0))
577
madd.d rC32, rC32, ra3, rb2
578
prefA(256+KB*8*8(pA1))
579
madd.d rC03, rC03, ra0, rb3
580
prefA(256+KB*8*8(pA2))
581
madd.d rC13, rC13, ra1, rb3
582
prefA(256+KB*8*8(pA3))
583
madd.d rC23, rC23, ra2, rb3
584
madd.d rC33, rC33, ra3, rb3
588
madd.d rC00, rC00, rA0, rB0
590
madd.d rC10, rC10, rA1, rB0
592
madd.d rC20, rC20, rA2, rB0
594
madd.d rC30, rC30, rA3, rB0
596
madd.d rC01, rC01, rA0, rB1
598
madd.d rC11, rC11, rA1, rB1
600
madd.d rC21, rC21, rA2, rB1
602
madd.d rC31, rC31, rA3, rB1
603
madd.d rC02, rC02, rA0, rB2
604
madd.d rC12, rC12, rA1, rB2
605
madd.d rC22, rC22, rA2, rB2
606
madd.d rC32, rC32, rA3, rB2
607
madd.d rC03, rC03, rA0, rB3
608
madd.d rC13, rC13, rA1, rB3
609
madd.d rC23, rC23, rA2, rB3
610
madd.d rC33, rC33, rA3, rB3
612
madd.d rC00, rC00, ra0, rb0
614
madd.d rC10, rC10, ra1, rb0
616
madd.d rC20, rC20, ra2, rb0
618
madd.d rC30, rC30, ra3, rb0
620
madd.d rC01, rC01, ra0, rb1
622
madd.d rC11, rC11, ra1, rb1
624
madd.d rC21, rC21, ra2, rb1
626
madd.d rC31, rC31, ra3, rb1
627
madd.d rC02, rC02, ra0, rb2
628
madd.d rC12, rC12, ra1, rb2
629
madd.d rC22, rC22, ra2, rb2
630
madd.d rC32, rC32, ra3, rb2
631
madd.d rC03, rC03, ra0, rb3
632
madd.d rC13, rC13, ra1, rb3
633
madd.d rC23, rC23, ra2, rb3
634
madd.d rC33, rC33, ra3, rb3
638
madd.d rC00, rC00, rA0, rB0
640
madd.d rC10, rC10, rA1, rB0
642
madd.d rC20, rC20, rA2, rB0
644
madd.d rC30, rC30, rA3, rB0
646
madd.d rC01, rC01, rA0, rB1
648
madd.d rC11, rC11, rA1, rB1
650
madd.d rC21, rC21, rA2, rB1
652
madd.d rC31, rC31, rA3, rB1
653
madd.d rC02, rC02, rA0, rB2
654
prefA(320+KB*8*8(pA0))
655
madd.d rC12, rC12, rA1, rB2
656
madd.d rC22, rC22, rA2, rB2
657
prefA(320+KB*8*8(pA1))
658
madd.d rC32, rC32, rA3, rB2
659
madd.d rC03, rC03, rA0, rB3
660
prefA(320+KB*8*8(pA2))
661
madd.d rC13, rC13, rA1, rB3
662
madd.d rC23, rC23, rA2, rB3
663
prefA(320+KB*8*8(pA3))
664
madd.d rC33, rC33, rA3, rB3
666
madd.d rC00, rC00, ra0, rb0
668
madd.d rC10, rC10, ra1, rb0
670
madd.d rC20, rC20, ra2, rb0
672
madd.d rC30, rC30, ra3, rb0
674
madd.d rC01, rC01, ra0, rb1
676
madd.d rC11, rC11, ra1, rb1
678
madd.d rC21, rC21, ra2, rb1
680
madd.d rC31, rC31, ra3, rb1
681
madd.d rC02, rC02, ra0, rb2
682
madd.d rC12, rC12, ra1, rb2
683
madd.d rC22, rC22, ra2, rb2
684
madd.d rC32, rC32, ra3, rb2
685
madd.d rC03, rC03, ra0, rb3
686
madd.d rC13, rC13, ra1, rb3
687
madd.d rC23, rC23, ra2, rb3
688
madd.d rC33, rC33, ra3, rb3
692
madd.d rC00, rC00, rA0, rB0
694
madd.d rC10, rC10, rA1, rB0
696
madd.d rC20, rC20, rA2, rB0
698
madd.d rC30, rC30, rA3, rB0
700
madd.d rC01, rC01, rA0, rB1
702
madd.d rC11, rC11, rA1, rB1
704
madd.d rC21, rC21, rA2, rB1
706
madd.d rC31, rC31, rA3, rB1
707
madd.d rC02, rC02, rA0, rB2
708
madd.d rC12, rC12, rA1, rB2
709
madd.d rC22, rC22, rA2, rB2
710
madd.d rC32, rC32, rA3, rB2
711
madd.d rC03, rC03, rA0, rB3
712
madd.d rC13, rC13, rA1, rB3
713
madd.d rC23, rC23, rA2, rB3
714
madd.d rC33, rC33, rA3, rB3
716
madd.d rC00, rC00, ra0, rb0
718
madd.d rC10, rC10, ra1, rb0
720
madd.d rC20, rC20, ra2, rb0
722
madd.d rC30, rC30, ra3, rb0
724
madd.d rC01, rC01, ra0, rb1
726
madd.d rC11, rC11, ra1, rb1
728
madd.d rC21, rC21, ra2, rb1
730
madd.d rC31, rC31, ra3, rb1
731
madd.d rC02, rC02, ra0, rb2
732
prefA(352+KB*8*8(pA0))
733
madd.d rC12, rC12, ra1, rb2
734
prefA(352+KB*8*8(pA1))
735
madd.d rC22, rC22, ra2, rb2
736
madd.d rC32, rC32, ra3, rb2
737
prefA(352+KB*8*8(pA2))
738
madd.d rC03, rC03, ra0, rb3
739
madd.d rC13, rC13, ra1, rb3
740
prefA(352+KB*8*8(pA3))
741
madd.d rC23, rC23, ra2, rb3
742
madd.d rC33, rC33, ra3, rb3
746
madd.d rC00, rC00, rA0, rB0
748
madd.d rC10, rC10, rA1, rB0
750
madd.d rC20, rC20, rA2, rB0
752
madd.d rC30, rC30, rA3, rB0
754
madd.d rC01, rC01, rA0, rB1
756
madd.d rC11, rC11, rA1, rB1
758
madd.d rC21, rC21, rA2, rB1
760
madd.d rC31, rC31, rA3, rB1
761
madd.d rC02, rC02, rA0, rB2
762
madd.d rC12, rC12, rA1, rB2
763
madd.d rC22, rC22, rA2, rB2
764
madd.d rC32, rC32, rA3, rB2
765
madd.d rC03, rC03, rA0, rB3
766
madd.d rC13, rC13, rA1, rB3
767
madd.d rC23, rC23, rA2, rB3
768
madd.d rC33, rC33, rA3, rB3
770
madd.d rC00, rC00, ra0, rb0
772
madd.d rC10, rC10, ra1, rb0
774
madd.d rC20, rC20, ra2, rb0
776
madd.d rC30, rC30, ra3, rb0
778
madd.d rC01, rC01, ra0, rb1
780
madd.d rC11, rC11, ra1, rb1
782
madd.d rC21, rC21, ra2, rb1
784
madd.d rC31, rC31, ra3, rb1
785
madd.d rC02, rC02, ra0, rb2
786
madd.d rC12, rC12, ra1, rb2
787
madd.d rC22, rC22, ra2, rb2
789
madd.d rC32, rC32, ra3, rb2
791
madd.d rC03, rC03, ra0, rb3
793
madd.d rC13, rC13, ra1, rb3
795
madd.d rC23, rC23, ra2, rb3
796
madd.d rC33, rC33, ra3, rb3
800
madd.d rC00, rC00, rA0, rB0
802
madd.d rC10, rC10, rA1, rB0
804
madd.d rC20, rC20, rA2, rB0
806
madd.d rC30, rC30, rA3, rB0
808
madd.d rC01, rC01, rA0, rB1
810
madd.d rC11, rC11, rA1, rB1
812
madd.d rC21, rC21, rA2, rB1
814
madd.d rC31, rC31, rA3, rB1
815
madd.d rC02, rC02, rA0, rB2
816
madd.d rC12, rC12, rA1, rB2
817
madd.d rC22, rC22, rA2, rB2
818
prefB(32+KB*8*4(pB0))
819
madd.d rC32, rC32, rA3, rB2
820
prefB(32+KB*8*4(pB1))
821
madd.d rC03, rC03, rA0, rB3
822
prefB(32+KB*8*4(pB2))
823
madd.d rC13, rC13, rA1, rB3
824
prefB(32+KB*8*4(pB3))
825
madd.d rC23, rC23, rA2, rB3
826
madd.d rC33, rC33, rA3, rB3
828
madd.d rC00, rC00, ra0, rb0
830
madd.d rC10, rC10, ra1, rb0
832
madd.d rC20, rC20, ra2, rb0
834
madd.d rC30, rC30, ra3, rb0
836
madd.d rC01, rC01, ra0, rb1
838
madd.d rC11, rC11, ra1, rb1
840
madd.d rC21, rC21, ra2, rb1
842
madd.d rC31, rC31, ra3, rb1
843
madd.d rC02, rC02, ra0, rb2
844
madd.d rC12, rC12, ra1, rb2
845
madd.d rC22, rC22, ra2, rb2
846
prefB(64+KB*8*4(pB0))
847
madd.d rC32, rC32, ra3, rb2
848
prefB(64+KB*8*4(pB1))
849
madd.d rC03, rC03, ra0, rb3
850
prefB(64+KB*8*4(pB2))
851
madd.d rC13, rC13, ra1, rb3
852
prefB(64+KB*8*4(pB3))
853
madd.d rC23, rC23, ra2, rb3
854
madd.d rC33, rC33, ra3, rb3
858
madd.d rC00, rC00, rA0, rB0
860
madd.d rC10, rC10, rA1, rB0
862
madd.d rC20, rC20, rA2, rB0
864
madd.d rC30, rC30, rA3, rB0
866
madd.d rC01, rC01, rA0, rB1
868
madd.d rC11, rC11, rA1, rB1
870
madd.d rC21, rC21, rA2, rB1
872
madd.d rC31, rC31, rA3, rB1
873
madd.d rC02, rC02, rA0, rB2
874
madd.d rC12, rC12, rA1, rB2
875
madd.d rC22, rC22, rA2, rB2
876
prefB(96+KB*8*4(pB0))
877
madd.d rC32, rC32, rA3, rB2
878
prefB(96+KB*8*4(pB1))
879
madd.d rC03, rC03, rA0, rB3
880
prefB(96+KB*8*4(pB2))
881
madd.d rC13, rC13, rA1, rB3
882
prefB(96+KB*8*4(pB3))
883
madd.d rC23, rC23, rA2, rB3
884
madd.d rC33, rC33, rA3, rB3
886
madd.d rC00, rC00, ra0, rb0
888
madd.d rC10, rC10, ra1, rb0
890
madd.d rC20, rC20, ra2, rb0
892
madd.d rC30, rC30, ra3, rb0
894
madd.d rC01, rC01, ra0, rb1
896
madd.d rC11, rC11, ra1, rb1
898
madd.d rC21, rC21, ra2, rb1
900
madd.d rC31, rC31, ra3, rb1
901
madd.d rC02, rC02, ra0, rb2
902
madd.d rC12, rC12, ra1, rb2
903
madd.d rC22, rC22, ra2, rb2
904
prefB(128+KB*8*4(pB0))
905
madd.d rC32, rC32, ra3, rb2
906
prefB(128+KB*8*4(pB1))
907
madd.d rC03, rC03, ra0, rb3
908
prefB(128+KB*8*4(pB2))
909
madd.d rC13, rC13, ra1, rb3
910
prefB(128+KB*8*4(pB3))
911
madd.d rC23, rC23, ra2, rb3
912
madd.d rC33, rC33, ra3, rb3
916
madd.d rC00, rC00, rA0, rB0
918
madd.d rC10, rC10, rA1, rB0
920
madd.d rC20, rC20, rA2, rB0
922
madd.d rC30, rC30, rA3, rB0
924
madd.d rC01, rC01, rA0, rB1
926
madd.d rC11, rC11, rA1, rB1
928
madd.d rC21, rC21, rA2, rB1
930
madd.d rC31, rC31, rA3, rB1
931
madd.d rC02, rC02, rA0, rB2
932
prefB(160+KB*8*4(pB0))
933
madd.d rC12, rC12, rA1, rB2
934
prefB(160+KB*8*4(pB1))
935
madd.d rC22, rC22, rA2, rB2
936
prefB(160+KB*8*4(pB2))
937
madd.d rC32, rC32, rA3, rB2
938
prefB(160+KB*8*4(pB3))
939
madd.d rC03, rC03, rA0, rB3
940
madd.d rC13, rC13, rA1, rB3
941
madd.d rC23, rC23, rA2, rB3
942
madd.d rC33, rC33, rA3, rB3
944
madd.d rC00, rC00, ra0, rb0
946
madd.d rC10, rC10, ra1, rb0
948
madd.d rC20, rC20, ra2, rb0
950
madd.d rC30, rC30, ra3, rb0
952
madd.d rC01, rC01, ra0, rb1
954
madd.d rC11, rC11, ra1, rb1
956
madd.d rC21, rC21, ra2, rb1
958
madd.d rC31, rC31, ra3, rb1
959
madd.d rC02, rC02, ra0, rb2
960
madd.d rC12, rC12, ra1, rb2
961
madd.d rC22, rC22, ra2, rb2
962
prefB(192+KB*8*4(pB0))
963
madd.d rC32, rC32, ra3, rb2
964
prefB(192+KB*8*4(pB1))
965
madd.d rC03, rC03, ra0, rb3
966
prefB(192+KB*8*4(pB2))
967
madd.d rC13, rC13, ra1, rb3
968
prefB(192+KB*8*4(pB3))
969
madd.d rC23, rC23, ra2, rb3
970
madd.d rC33, rC33, ra3, rb3
974
madd.d rC00, rC00, rA0, rB0
976
madd.d rC10, rC10, rA1, rB0
978
madd.d rC20, rC20, rA2, rB0
980
madd.d rC30, rC30, rA3, rB0
982
madd.d rC01, rC01, rA0, rB1
984
madd.d rC11, rC11, rA1, rB1
986
madd.d rC21, rC21, rA2, rB1
988
madd.d rC31, rC31, rA3, rB1
989
madd.d rC02, rC02, rA0, rB2
990
madd.d rC12, rC12, rA1, rB2
991
madd.d rC22, rC22, rA2, rB2
992
prefB(224+KB*8*4(pB0))
993
madd.d rC32, rC32, rA3, rB2
994
prefB(224+KB*8*4(pB1))
995
madd.d rC03, rC03, rA0, rB3
996
prefB(224+KB*8*4(pB2))
997
madd.d rC13, rC13, rA1, rB3
998
prefB(224+KB*8*4(pB3))
1003
madd.d rC23, rC23, rA2, rB3
1004
madd.d rC33, rC33, rA3, rB3
1006
madd.d rC00, rC00, ra0, rb0
1008
madd.d rC10, rC10, ra1, rb0
1010
madd.d rC20, rC20, ra2, rb0
1012
madd.d rC30, rC30, ra3, rb0
1014
madd.d rC01, rC01, ra0, rb1
1016
madd.d rC11, rC11, ra1, rb1
1018
madd.d rC21, rC21, ra2, rb1
1020
madd.d rC31, rC31, ra3, rb1
1021
prefB(256+KB*8*4(pB0))
1022
madd.d rC02, rC02, ra0, rb2
1023
prefB(256+KB*8*4(pB1))
1024
madd.d rC12, rC12, ra1, rb2
1025
prefB(256+KB*8*4(pB2))
1026
madd.d rC22, rC22, ra2, rb2
1027
prefB(256+KB*8*4(pB3))
1032
madd.d rC32, rC32, ra3, rb2
1033
prefB(288+KB*8*4(pB0))
1034
madd.d rC03, rC03, ra0, rb3
1035
prefB(288+KB*8*4(pB1))
1036
madd.d rC13, rC13, ra1, rb3
1037
prefB(288+KB*8*4(pB2))
1038
madd.d rC23, rC23, ra2, rb3
1039
prefB(288+KB*8*4(pB3))
1044
madd.d rC33, rC33, ra3, rb3
1048
madd.d rC00, rC00, rA0, rB0
1050
madd.d rC10, rC10, rA1, rB0
1052
madd.d rC20, rC20, rA2, rB0
1054
madd.d rC30, rC30, rA3, rB0
1056
madd.d rC01, rC01, rA0, rB1
1058
madd.d rC11, rC11, rA1, rB1
1060
madd.d rC21, rC21, rA2, rB1
1062
madd.d rC31, rC31, rA3, rB1
1063
madd.d rC02, rC02, rA0, rB2
1064
madd.d rC12, rC12, rA1, rB2
1065
madd.d rC22, rC22, rA2, rB2
1066
prefB(320+KB*8*4(pB0))
1067
madd.d rC32, rC32, rA3, rB2
1068
prefB(320+KB*8*4(pB1))
1069
madd.d rC03, rC03, rA0, rB3
1070
prefB(320+KB*8*4(pB2))
1071
madd.d rC13, rC13, rA1, rB3
1072
prefB(320+KB*8*4(pB3))
1077
madd.d rC23, rC23, rA2, rB3
1078
madd.d rC33, rC33, rA3, rB3
1080
madd.d rC00, rC00, ra0, rb0
1082
madd.d rC10, rC10, ra1, rb0
1084
madd.d rC20, rC20, ra2, rb0
1086
madd.d rC30, rC30, ra3, rb0
1088
madd.d rC01, rC01, ra0, rb1
1090
madd.d rC11, rC11, ra1, rb1
1092
madd.d rC21, rC21, ra2, rb1
1094
madd.d rC31, rC31, ra3, rb1
1095
prefC(CMUL(32)(pC0))
1096
madd.d rC02, rC02, ra0, rb2
1097
prefC(CMUL(32)(pC1))
1098
madd.d rC12, rC12, ra1, rb2
1099
prefC(CMUL(32)(pC2))
1100
madd.d rC22, rC22, ra2, rb2
1101
prefC(CMUL(32)(pC3))
1102
madd.d rC32, rC32, ra3, rb2
1103
madd.d rC03, rC03, ra0, rb3
1104
madd.d rC13, rC13, ra1, rb3
1105
madd.d rC23, rC23, ra2, rb3
1106
madd.d rC33, rC33, ra3, rb3
1110
madd.d rC00, rC00, rA0, rB0
1112
madd.d rC10, rC10, rA1, rB0
1114
madd.d rC20, rC20, rA2, rB0
1116
madd.d rC30, rC30, rA3, rB0
1118
madd.d rC01, rC01, rA0, rB1
1120
madd.d rC11, rC11, rA1, rB1
1122
madd.d rC21, rC21, rA2, rB1
1124
madd.d rC31, rC31, rA3, rB1
1125
madd.d rC02, rC02, rA0, rB2
1126
madd.d rC12, rC12, rA1, rB2
1127
madd.d rC22, rC22, rA2, rB2
1128
prefB(352+KB*8*4(pB0))
1129
madd.d rC32, rC32, rA3, rB2
1130
prefB(352+KB*8*4(pB1))
1131
madd.d rC03, rC03, rA0, rB3
1132
prefB(352+KB*8*4(pB2))
1133
madd.d rC13, rC13, rA1, rB3
1134
prefB(352+KB*8*4(pB3))
1139
madd.d rC23, rC23, rA2, rB3
1140
madd.d rC33, rC33, rA3, rB3
1142
madd.d rC00, rC00, ra0, rb0
1144
madd.d rC10, rC10, ra1, rb0
1146
madd.d rC20, rC20, ra2, rb0
1148
madd.d rC30, rC30, ra3, rb0
1150
madd.d rC01, rC01, ra0, rb1
1152
madd.d rC11, rC11, ra1, rb1
1154
madd.d rC21, rC21, ra2, rb1
1156
madd.d rC31, rC31, ra3, rb1
1157
madd.d rC02, rC02, ra0, rb2
1158
madd.d rC12, rC12, ra1, rb2
1159
madd.d rC22, rC22, ra2, rb2
1160
prefB(384+KB*8*4(pB0))
1161
madd.d rC32, rC32, ra3, rb2
1162
prefB(384+KB*8*4(pB1))
1163
madd.d rC03, rC03, ra0, rb3
1164
prefB(384+KB*8*4(pB2))
1165
madd.d rC13, rC13, ra1, rb3
1166
prefB(384+KB*8*4(pB3))
1171
madd.d rC23, rC23, ra2, rb3
1172
madd.d rC33, rC33, ra3, rb3
1176
madd.d rC00, rC00, rA0, rB0
1178
madd.d rC10, rC10, rA1, rB0
1180
madd.d rC20, rC20, rA2, rB0
1182
madd.d rC30, rC30, rA3, rB0
1184
madd.d rC01, rC01, rA0, rB1
1186
madd.d rC11, rC11, rA1, rB1
1188
madd.d rC21, rC21, rA2, rB1
1190
madd.d rC31, rC31, rA3, rB1
1191
madd.d rC02, rC02, rA0, rB2
1192
madd.d rC12, rC12, rA1, rB2
1193
madd.d rC22, rC22, rA2, rB2
1194
madd.d rC32, rC32, rA3, rB2
1195
madd.d rC03, rC03, rA0, rB3
1196
madd.d rC13, rC13, rA1, rB3
1197
madd.d rC23, rC23, rA2, rB3
1198
madd.d rC33, rC33, rA3, rB3
1200
madd.d rC00, rC00, ra0, rb0
1202
madd.d rC10, rC10, ra1, rb0
1204
madd.d rC20, rC20, ra2, rb0
1206
madd.d rC30, rC30, ra3, rb0
1208
madd.d rC01, rC01, ra0, rb1
1210
madd.d rC11, rC11, ra1, rb1
1212
madd.d rC21, rC21, ra2, rb1
1214
madd.d rC31, rC31, ra3, rb1
1215
prefB(416+KB*8*4(pB0))
1216
madd.d rC02, rC02, ra0, rb2
1217
prefB(416+KB*8*4(pB1))
1218
madd.d rC12, rC12, ra1, rb2
1219
prefB(416+KB*8*4(pB2))
1220
madd.d rC22, rC22, ra2, rb2
1221
prefB(416+KB*8*4(pB3))
1226
madd.d rC32, rC32, ra3, rb2
1227
prefB(448+KB*8*4(pB0))
1228
madd.d rC03, rC03, ra0, rb3
1229
prefB(448+KB*8*4(pB1))
1230
madd.d rC13, rC13, ra1, rb3
1231
prefB(448+KB*8*4(pB2))
1232
madd.d rC23, rC23, ra2, rb3
1233
prefB(448+KB*8*4(pB3))
1234
madd.d rC33, rC33, ra3, rb3
1238
madd.d rC00, rC00, rA0, rB0
1240
madd.d rC10, rC10, rA1, rB0
1242
madd.d rC20, rC20, rA2, rB0
1244
madd.d rC30, rC30, rA3, rB0
1246
madd.d rC01, rC01, rA0, rB1
1248
madd.d rC11, rC11, rA1, rB1
1250
madd.d rC21, rC21, rA2, rB1
1252
madd.d rC31, rC31, rA3, rB1
1253
madd.d rC02, rC02, rA0, rB2
1254
madd.d rC12, rC12, rA1, rB2
1255
madd.d rC22, rC22, rA2, rB2
1256
madd.d rC32, rC32, rA3, rB2
1257
madd.d rC03, rC03, rA0, rB3
1258
madd.d rC13, rC13, rA1, rB3
1259
madd.d rC23, rC23, rA2, rB3
1260
madd.d rC33, rC33, rA3, rB3
1262
madd.d rC00, rC00, ra0, rb0
1264
madd.d rC10, rC10, ra1, rb0
1266
madd.d rC20, rC20, ra2, rb0
1268
madd.d rC30, rC30, ra3, rb0
1270
madd.d rC01, rC01, ra0, rb1
1272
madd.d rC11, rC11, ra1, rb1
1274
madd.d rC21, rC21, ra2, rb1
1276
madd.d rC31, rC31, ra3, rb1
1277
madd.d rC02, rC02, ra0, rb2
1278
madd.d rC12, rC12, ra1, rb2
1279
madd.d rC22, rC22, ra2, rb2
1280
madd.d rC32, rC32, ra3, rb2
1281
madd.d rC03, rC03, ra0, rb3
1282
madd.d rC13, rC13, ra1, rb3
1283
madd.d rC23, rC23, ra2, rb3
1284
madd.d rC33, rC33, ra3, rb3
1288
madd.d rC00, rC00, rA0, rB0
1290
madd.d rC10, rC10, rA1, rB0
1292
madd.d rC20, rC20, rA2, rB0
1294
madd.d rC30, rC30, rA3, rB0
1296
madd.d rC01, rC01, rA0, rB1
1298
madd.d rC11, rC11, rA1, rB1
1300
madd.d rC21, rC21, rA2, rB1
1302
madd.d rC31, rC31, rA3, rB1
1303
madd.d rC02, rC02, rA0, rB2
1304
madd.d rC12, rC12, rA1, rB2
1305
madd.d rC22, rC22, rA2, rB2
1306
madd.d rC32, rC32, rA3, rB2
1307
madd.d rC03, rC03, rA0, rB3
1308
madd.d rC13, rC13, rA1, rB3
1309
madd.d rC23, rC23, rA2, rB3
1310
madd.d rC33, rC33, rA3, rB3
1312
madd.d rC00, rC00, ra0, rb0
1314
madd.d rC10, rC10, ra1, rb0
1316
madd.d rC20, rC20, ra2, rb0
1318
madd.d rC30, rC30, ra3, rb0
1320
madd.d rC01, rC01, ra0, rb1
1322
madd.d rC11, rC11, ra1, rb1
1324
madd.d rC21, rC21, ra2, rb1
1326
madd.d rC31, rC31, ra3, rb1
1327
madd.d rC02, rC02, ra0, rb2
1328
madd.d rC12, rC12, ra1, rb2
1329
madd.d rC22, rC22, ra2, rb2
1330
madd.d rC32, rC32, ra3, rb2
1331
madd.d rC03, rC03, ra0, rb3
1332
madd.d rC13, rC13, ra1, rb3
1333
madd.d rC23, rC23, ra2, rb3
1334
madd.d rC33, rC33, ra3, rb3
1338
madd.d rC00, rC00, rA0, rB0
1340
madd.d rC10, rC10, rA1, rB0
1342
madd.d rC20, rC20, rA2, rB0
1344
madd.d rC30, rC30, rA3, rB0
1346
madd.d rC01, rC01, rA0, rB1
1348
madd.d rC11, rC11, rA1, rB1
1350
madd.d rC21, rC21, rA2, rB1
1352
madd.d rC31, rC31, rA3, rB1
1353
madd.d rC02, rC02, rA0, rB2
1354
madd.d rC12, rC12, rA1, rB2
1355
madd.d rC22, rC22, rA2, rB2
1356
madd.d rC32, rC32, rA3, rB2
1357
madd.d rC03, rC03, rA0, rB3
1358
madd.d rC13, rC13, rA1, rB3
1359
madd.d rC23, rC23, rA2, rB3
1360
madd.d rC33, rC33, rA3, rB3
1362
madd.d rC00, rC00, ra0, rb0
1364
madd.d rC10, rC10, ra1, rb0
1366
madd.d rC20, rC20, ra2, rb0
1368
madd.d rC30, rC30, ra3, rb0
1370
madd.d rC01, rC01, ra0, rb1
1372
madd.d rC11, rC11, ra1, rb1
1374
madd.d rC21, rC21, ra2, rb1
1376
madd.d rC31, rC31, ra3, rb1
1377
madd.d rC02, rC02, ra0, rb2
1378
madd.d rC12, rC12, ra1, rb2
1379
madd.d rC22, rC22, ra2, rb2
1380
madd.d rC32, rC32, ra3, rb2
1381
madd.d rC03, rC03, ra0, rb3
1382
madd.d rC13, rC13, ra1, rb3
1383
madd.d rC23, rC23, ra2, rb3
1384
madd.d rC33, rC33, ra3, rb3
1388
madd.d rC00, rC00, rA0, rB0
1390
madd.d rC10, rC10, rA1, rB0
1392
madd.d rC20, rC20, rA2, rB0
1394
madd.d rC30, rC30, rA3, rB0
1396
madd.d rC01, rC01, rA0, rB1
1398
madd.d rC11, rC11, rA1, rB1
1400
madd.d rC21, rC21, rA2, rB1
1402
madd.d rC31, rC31, rA3, rB1
1403
madd.d rC02, rC02, rA0, rB2
1404
madd.d rC12, rC12, rA1, rB2
1405
madd.d rC22, rC22, rA2, rB2
1406
madd.d rC32, rC32, rA3, rB2
1407
madd.d rC03, rC03, rA0, rB3
1408
madd.d rC13, rC13, rA1, rB3
1409
madd.d rC23, rC23, rA2, rB3
1410
madd.d rC33, rC33, rA3, rB3
1412
madd.d rC00, rC00, ra0, rb0
1414
madd.d rC10, rC10, ra1, rb0
1416
madd.d rC20, rC20, ra2, rb0
1418
madd.d rC30, rC30, ra3, rb0
1420
madd.d rC01, rC01, ra0, rb1
1422
madd.d rC11, rC11, ra1, rb1
1424
madd.d rC21, rC21, ra2, rb1
1426
madd.d rC31, rC31, ra3, rb1
1427
madd.d rC02, rC02, ra0, rb2
1428
madd.d rC12, rC12, ra1, rb2
1429
madd.d rC22, rC22, ra2, rb2
1430
madd.d rC32, rC32, ra3, rb2
1431
madd.d rC03, rC03, ra0, rb3
1432
madd.d rC13, rC13, ra1, rb3
1433
madd.d rC23, rC23, ra2, rb3
1434
madd.d rC33, rC33, ra3, rb3
1438
madd.d rC00, rC00, rA0, rB0
1440
madd.d rC10, rC10, rA1, rB0
1442
madd.d rC20, rC20, rA2, rB0
1444
madd.d rC30, rC30, rA3, rB0
1446
madd.d rC01, rC01, rA0, rB1
1448
madd.d rC11, rC11, rA1, rB1
1450
madd.d rC21, rC21, rA2, rB1
1452
madd.d rC31, rC31, rA3, rB1
1453
madd.d rC02, rC02, rA0, rB2
1454
madd.d rC12, rC12, rA1, rB2
1455
madd.d rC22, rC22, rA2, rB2
1456
madd.d rC32, rC32, rA3, rB2
1457
madd.d rC03, rC03, rA0, rB3
1458
madd.d rC13, rC13, rA1, rB3
1459
madd.d rC23, rC23, rA2, rB3
1460
madd.d rC33, rC33, rA3, rB3
1462
madd.d rC00, rC00, ra0, rb0
1464
madd.d rC10, rC10, ra1, rb0
1466
madd.d rC20, rC20, ra2, rb0
1468
madd.d rC30, rC30, ra3, rb0
1470
madd.d rC01, rC01, ra0, rb1
1472
madd.d rC11, rC11, ra1, rb1
1474
madd.d rC21, rC21, ra2, rb1
1476
madd.d rC31, rC31, ra3, rb1
1477
madd.d rC02, rC02, ra0, rb2
1478
madd.d rC12, rC12, ra1, rb2
1479
madd.d rC22, rC22, ra2, rb2
1480
madd.d rC32, rC32, ra3, rb2
1481
madd.d rC03, rC03, ra0, rb3
1482
madd.d rC13, rC13, ra1, rb3
1483
madd.d rC23, rC23, ra2, rb3
1484
madd.d rC33, rC33, ra3, rb3
1488
madd.d rC00, rC00, rA0, rB0
1490
madd.d rC10, rC10, rA1, rB0
1492
madd.d rC20, rC20, rA2, rB0
1494
madd.d rC30, rC30, rA3, rB0
1496
madd.d rC01, rC01, rA0, rB1
1498
madd.d rC11, rC11, rA1, rB1
1500
madd.d rC21, rC21, rA2, rB1
1502
madd.d rC31, rC31, rA3, rB1
1503
madd.d rC02, rC02, rA0, rB2
1504
madd.d rC12, rC12, rA1, rB2
1505
madd.d rC22, rC22, rA2, rB2
1506
madd.d rC32, rC32, rA3, rB2
1507
madd.d rC03, rC03, rA0, rB3
1508
madd.d rC13, rC13, rA1, rB3
1509
madd.d rC23, rC23, rA2, rB3
1510
madd.d rC33, rC33, rA3, rB3
1512
madd.d rC00, rC00, ra0, rb0
1514
madd.d rC10, rC10, ra1, rb0
1516
madd.d rC20, rC20, ra2, rb0
1518
madd.d rC30, rC30, ra3, rb0
1520
madd.d rC01, rC01, ra0, rb1
1522
madd.d rC11, rC11, ra1, rb1
1524
madd.d rC21, rC21, ra2, rb1
1526
madd.d rC31, rC31, ra3, rb1
1527
madd.d rC02, rC02, ra0, rb2
1528
madd.d rC12, rC12, ra1, rb2
1529
madd.d rC22, rC22, ra2, rb2
1530
madd.d rC32, rC32, ra3, rb2
1531
madd.d rC03, rC03, ra0, rb3
1532
madd.d rC13, rC13, ra1, rb3
1533
madd.d rC23, rC23, ra2, rb3
1534
madd.d rC33, rC33, ra3, rb3
1538
madd.d rC00, rC00, rA0, rB0
1540
madd.d rC10, rC10, rA1, rB0
1542
madd.d rC20, rC20, rA2, rB0
1544
madd.d rC30, rC30, rA3, rB0
1546
madd.d rC01, rC01, rA0, rB1
1548
madd.d rC11, rC11, rA1, rB1
1550
madd.d rC21, rC21, rA2, rB1
1552
madd.d rC31, rC31, rA3, rB1
1553
madd.d rC02, rC02, rA0, rB2
1554
madd.d rC12, rC12, rA1, rB2
1555
madd.d rC22, rC22, rA2, rB2
1556
madd.d rC32, rC32, rA3, rB2
1557
madd.d rC03, rC03, rA0, rB3
1558
madd.d rC13, rC13, rA1, rB3
1559
madd.d rC23, rC23, rA2, rB3
1560
madd.d rC33, rC33, rA3, rB3
1562
madd.d rC00, rC00, ra0, rb0
1564
madd.d rC10, rC10, ra1, rb0
1566
madd.d rC20, rC20, ra2, rb0
1568
madd.d rC30, rC30, ra3, rb0
1570
madd.d rC01, rC01, ra0, rb1
1572
madd.d rC11, rC11, ra1, rb1
1574
madd.d rC21, rC21, ra2, rb1
1576
madd.d rC31, rC31, ra3, rb1
1577
madd.d rC02, rC02, ra0, rb2
1578
madd.d rC12, rC12, ra1, rb2
1579
madd.d rC22, rC22, ra2, rb2
1580
madd.d rC32, rC32, ra3, rb2
1581
madd.d rC03, rC03, ra0, rb3
1582
madd.d rC13, rC13, ra1, rb3
1583
madd.d rC23, rC23, ra2, rb3
1584
madd.d rC33, rC33, ra3, rb3
1588
madd.d rC00, rC00, rA0, rB0
1590
madd.d rC10, rC10, rA1, rB0
1592
madd.d rC20, rC20, rA2, rB0
1594
madd.d rC30, rC30, rA3, rB0
1596
madd.d rC01, rC01, rA0, rB1
1598
madd.d rC11, rC11, rA1, rB1
1600
madd.d rC21, rC21, rA2, rB1
1602
madd.d rC31, rC31, rA3, rB1
1603
madd.d rC02, rC02, rA0, rB2
1604
madd.d rC12, rC12, rA1, rB2
1605
madd.d rC22, rC22, rA2, rB2
1606
madd.d rC32, rC32, rA3, rB2
1607
madd.d rC03, rC03, rA0, rB3
1608
madd.d rC13, rC13, rA1, rB3
1609
madd.d rC23, rC23, rA2, rB3
1610
madd.d rC33, rC33, rA3, rB3
1612
madd.d rC00, rC00, ra0, rb0
1614
madd.d rC10, rC10, ra1, rb0
1616
madd.d rC20, rC20, ra2, rb0
1618
madd.d rC30, rC30, ra3, rb0
1620
madd.d rC01, rC01, ra0, rb1
1622
madd.d rC11, rC11, ra1, rb1
1624
madd.d rC21, rC21, ra2, rb1
1626
madd.d rC31, rC31, ra3, rb1
1627
madd.d rC02, rC02, ra0, rb2
1628
madd.d rC12, rC12, ra1, rb2
1629
madd.d rC22, rC22, ra2, rb2
1630
madd.d rC32, rC32, ra3, rb2
1631
madd.d rC03, rC03, ra0, rb3
1632
madd.d rC13, rC13, ra1, rb3
1633
madd.d rC23, rC23, ra2, rb3
1634
madd.d rC33, rC33, ra3, rb3
1638
madd.d rC00, rC00, rA0, rB0
1640
madd.d rC10, rC10, rA1, rB0
1642
madd.d rC20, rC20, rA2, rB0
1644
madd.d rC30, rC30, rA3, rB0
1646
madd.d rC01, rC01, rA0, rB1
1648
madd.d rC11, rC11, rA1, rB1
1650
madd.d rC21, rC21, rA2, rB1
1652
madd.d rC31, rC31, rA3, rB1
1653
madd.d rC02, rC02, rA0, rB2
1654
madd.d rC12, rC12, rA1, rB2
1655
madd.d rC22, rC22, rA2, rB2
1656
madd.d rC32, rC32, rA3, rB2
1657
madd.d rC03, rC03, rA0, rB3
1658
madd.d rC13, rC13, rA1, rB3
1659
madd.d rC23, rC23, rA2, rB3
1660
madd.d rC33, rC33, rA3, rB3
1662
madd.d rC00, rC00, ra0, rb0
1664
madd.d rC10, rC10, ra1, rb0
1666
madd.d rC20, rC20, ra2, rb0
1668
madd.d rC30, rC30, ra3, rb0
1670
madd.d rC01, rC01, ra0, rb1
1672
madd.d rC11, rC11, ra1, rb1
1674
madd.d rC21, rC21, ra2, rb1
1676
madd.d rC31, rC31, ra3, rb1
1677
madd.d rC02, rC02, ra0, rb2
1678
madd.d rC12, rC12, ra1, rb2
1679
madd.d rC22, rC22, ra2, rb2
1680
madd.d rC32, rC32, ra3, rb2
1681
madd.d rC03, rC03, ra0, rb3
1682
madd.d rC13, rC13, ra1, rb3
1683
madd.d rC23, rC23, ra2, rb3
1684
madd.d rC33, rC33, ra3, rb3
1688
madd.d rC00, rC00, rA0, rB0
1690
madd.d rC10, rC10, rA1, rB0
1692
madd.d rC20, rC20, rA2, rB0
1694
madd.d rC30, rC30, rA3, rB0
1696
madd.d rC01, rC01, rA0, rB1
1698
madd.d rC11, rC11, rA1, rB1
1700
madd.d rC21, rC21, rA2, rB1
1702
madd.d rC31, rC31, rA3, rB1
1703
madd.d rC02, rC02, rA0, rB2
1704
madd.d rC12, rC12, rA1, rB2
1705
madd.d rC22, rC22, rA2, rB2
1706
madd.d rC32, rC32, rA3, rB2
1707
madd.d rC03, rC03, rA0, rB3
1708
madd.d rC13, rC13, rA1, rB3
1709
madd.d rC23, rC23, rA2, rB3
1710
madd.d rC33, rC33, rA3, rB3
1712
madd.d rC00, rC00, ra0, rb0
1714
madd.d rC10, rC10, ra1, rb0
1716
madd.d rC20, rC20, ra2, rb0
1718
madd.d rC30, rC30, ra3, rb0
1720
madd.d rC01, rC01, ra0, rb1
1722
madd.d rC11, rC11, ra1, rb1
1724
madd.d rC21, rC21, ra2, rb1
1726
madd.d rC31, rC31, ra3, rb1
1727
madd.d rC02, rC02, ra0, rb2
1728
madd.d rC12, rC12, ra1, rb2
1729
madd.d rC22, rC22, ra2, rb2
1730
madd.d rC32, rC32, ra3, rb2
1731
madd.d rC03, rC03, ra0, rb3
1732
madd.d rC13, rC13, ra1, rb3
1733
madd.d rC23, rC23, ra2, rb3
1734
madd.d rC33, rC33, ra3, rb3
1738
madd.d rC00, rC00, rA0, rB0
1740
madd.d rC10, rC10, rA1, rB0
1742
madd.d rC20, rC20, rA2, rB0
1744
madd.d rC30, rC30, rA3, rB0
1746
madd.d rC01, rC01, rA0, rB1
1748
madd.d rC11, rC11, rA1, rB1
1750
madd.d rC21, rC21, rA2, rB1
1752
madd.d rC31, rC31, rA3, rB1
1753
madd.d rC02, rC02, rA0, rB2
1754
madd.d rC12, rC12, rA1, rB2
1755
madd.d rC22, rC22, rA2, rB2
1756
madd.d rC32, rC32, rA3, rB2
1757
madd.d rC03, rC03, rA0, rB3
1758
madd.d rC13, rC13, rA1, rB3
1759
madd.d rC23, rC23, rA2, rB3
1760
madd.d rC33, rC33, rA3, rB3
1762
madd.d rC00, rC00, ra0, rb0
1764
madd.d rC10, rC10, ra1, rb0
1766
madd.d rC20, rC20, ra2, rb0
1768
madd.d rC30, rC30, ra3, rb0
1770
madd.d rC01, rC01, ra0, rb1
1772
madd.d rC11, rC11, ra1, rb1
1774
madd.d rC21, rC21, ra2, rb1
1776
madd.d rC31, rC31, ra3, rb1
1777
madd.d rC02, rC02, ra0, rb2
1778
madd.d rC12, rC12, ra1, rb2
1779
madd.d rC22, rC22, ra2, rb2
1780
madd.d rC32, rC32, ra3, rb2
1781
madd.d rC03, rC03, ra0, rb3
1782
madd.d rC13, rC13, ra1, rb3
1783
madd.d rC23, rC23, ra2, rb3
1784
madd.d rC33, rC33, ra3, rb3
1788
madd.d rC00, rC00, rA0, rB0
1790
madd.d rC10, rC10, rA1, rB0
1792
madd.d rC20, rC20, rA2, rB0
1794
madd.d rC30, rC30, rA3, rB0
1796
madd.d rC01, rC01, rA0, rB1
1798
madd.d rC11, rC11, rA1, rB1
1800
madd.d rC21, rC21, rA2, rB1
1802
madd.d rC31, rC31, rA3, rB1
1803
madd.d rC02, rC02, rA0, rB2
1804
madd.d rC12, rC12, rA1, rB2
1805
madd.d rC22, rC22, rA2, rB2
1806
madd.d rC32, rC32, rA3, rB2
1807
madd.d rC03, rC03, rA0, rB3
1808
madd.d rC13, rC13, rA1, rB3
1809
madd.d rC23, rC23, rA2, rB3
1810
madd.d rC33, rC33, rA3, rB3
1812
madd.d rC00, rC00, ra0, rb0
1814
madd.d rC10, rC10, ra1, rb0
1816
madd.d rC20, rC20, ra2, rb0
1818
madd.d rC30, rC30, ra3, rb0
1820
madd.d rC01, rC01, ra0, rb1
1822
madd.d rC11, rC11, ra1, rb1
1824
madd.d rC21, rC21, ra2, rb1
1826
madd.d rC31, rC31, ra3, rb1
1827
madd.d rC02, rC02, ra0, rb2
1828
madd.d rC12, rC12, ra1, rb2
1829
madd.d rC22, rC22, ra2, rb2
1830
madd.d rC32, rC32, ra3, rb2
1831
madd.d rC03, rC03, ra0, rb3
1832
madd.d rC13, rC13, ra1, rb3
1833
madd.d rC23, rC23, ra2, rb3
1834
madd.d rC33, rC33, ra3, rb3
1838
madd.d rC00, rC00, rA0, rB0
1840
madd.d rC10, rC10, rA1, rB0
1842
madd.d rC20, rC20, rA2, rB0
1844
madd.d rC30, rC30, rA3, rB0
1846
madd.d rC01, rC01, rA0, rB1
1848
madd.d rC11, rC11, rA1, rB1
1850
madd.d rC21, rC21, rA2, rB1
1852
madd.d rC31, rC31, rA3, rB1
1853
madd.d rC02, rC02, rA0, rB2
1854
madd.d rC12, rC12, rA1, rB2
1855
madd.d rC22, rC22, rA2, rB2
1856
madd.d rC32, rC32, rA3, rB2
1857
madd.d rC03, rC03, rA0, rB3
1858
madd.d rC13, rC13, rA1, rB3
1859
madd.d rC23, rC23, rA2, rB3
1860
madd.d rC33, rC33, rA3, rB3
1862
madd.d rC00, rC00, ra0, rb0
1864
madd.d rC10, rC10, ra1, rb0
1866
madd.d rC20, rC20, ra2, rb0
1868
madd.d rC30, rC30, ra3, rb0
1870
madd.d rC01, rC01, ra0, rb1
1872
madd.d rC11, rC11, ra1, rb1
1874
madd.d rC21, rC21, ra2, rb1
1876
madd.d rC31, rC31, ra3, rb1
1877
madd.d rC02, rC02, ra0, rb2
1878
madd.d rC12, rC12, ra1, rb2
1879
madd.d rC22, rC22, ra2, rb2
1880
madd.d rC32, rC32, ra3, rb2
1881
madd.d rC03, rC03, ra0, rb3
1882
madd.d rC13, rC13, ra1, rb3
1883
madd.d rC23, rC23, ra2, rb3
1884
madd.d rC33, rC33, ra3, rb3
1888
madd.d rC00, rC00, rA0, rB0
1890
madd.d rC10, rC10, rA1, rB0
1892
madd.d rC20, rC20, rA2, rB0
1894
madd.d rC30, rC30, rA3, rB0
1896
madd.d rC01, rC01, rA0, rB1
1898
madd.d rC11, rC11, rA1, rB1
1900
madd.d rC21, rC21, rA2, rB1
1902
madd.d rC31, rC31, rA3, rB1
1903
madd.d rC02, rC02, rA0, rB2
1904
madd.d rC12, rC12, rA1, rB2
1905
madd.d rC22, rC22, rA2, rB2
1906
madd.d rC32, rC32, rA3, rB2
1907
madd.d rC03, rC03, rA0, rB3
1908
madd.d rC13, rC13, rA1, rB3
1909
madd.d rC23, rC23, rA2, rB3
1910
madd.d rC33, rC33, rA3, rB3
1912
madd.d rC00, rC00, ra0, rb0
1914
madd.d rC10, rC10, ra1, rb0
1916
madd.d rC20, rC20, ra2, rb0
1918
madd.d rC30, rC30, ra3, rb0
1920
madd.d rC01, rC01, ra0, rb1
1922
madd.d rC11, rC11, ra1, rb1
1924
madd.d rC21, rC21, ra2, rb1
1926
madd.d rC31, rC31, ra3, rb1
1927
madd.d rC02, rC02, ra0, rb2
1928
madd.d rC12, rC12, ra1, rb2
1929
madd.d rC22, rC22, ra2, rb2
1930
madd.d rC32, rC32, ra3, rb2
1931
madd.d rC03, rC03, ra0, rb3
1932
madd.d rC13, rC13, ra1, rb3
1933
madd.d rC23, rC23, ra2, rb3
1934
madd.d rC33, rC33, ra3, rb3
1938
madd.d rC00, rC00, rA0, rB0
1940
madd.d rC10, rC10, rA1, rB0
1942
madd.d rC20, rC20, rA2, rB0
1944
madd.d rC30, rC30, rA3, rB0
1946
madd.d rC01, rC01, rA0, rB1
1948
madd.d rC11, rC11, rA1, rB1
1950
madd.d rC21, rC21, rA2, rB1
1952
madd.d rC31, rC31, rA3, rB1
1953
madd.d rC02, rC02, rA0, rB2
1954
madd.d rC12, rC12, rA1, rB2
1955
madd.d rC22, rC22, rA2, rB2
1956
madd.d rC32, rC32, rA3, rB2
1957
madd.d rC03, rC03, rA0, rB3
1958
madd.d rC13, rC13, rA1, rB3
1959
madd.d rC23, rC23, rA2, rB3
1960
madd.d rC33, rC33, rA3, rB3
1962
madd.d rC00, rC00, ra0, rb0
1964
madd.d rC10, rC10, ra1, rb0
1966
madd.d rC20, rC20, ra2, rb0
1968
madd.d rC30, rC30, ra3, rb0
1970
madd.d rC01, rC01, ra0, rb1
1972
madd.d rC11, rC11, ra1, rb1
1974
madd.d rC21, rC21, ra2, rb1
1976
madd.d rC31, rC31, ra3, rb1
1977
madd.d rC02, rC02, ra0, rb2
1978
madd.d rC12, rC12, ra1, rb2
1979
madd.d rC22, rC22, ra2, rb2
1980
madd.d rC32, rC32, ra3, rb2
1981
madd.d rC03, rC03, ra0, rb3
1982
madd.d rC13, rC13, ra1, rb3
1983
madd.d rC23, rC23, ra2, rb3
1984
madd.d rC33, rC33, ra3, rb3
1988
madd.d rC00, rC00, rA0, rB0
1990
madd.d rC10, rC10, rA1, rB0
1992
madd.d rC20, rC20, rA2, rB0
1994
madd.d rC30, rC30, rA3, rB0
1996
madd.d rC01, rC01, rA0, rB1
1998
madd.d rC11, rC11, rA1, rB1
2000
madd.d rC21, rC21, rA2, rB1
2002
madd.d rC31, rC31, rA3, rB1
2003
madd.d rC02, rC02, rA0, rB2
2004
madd.d rC12, rC12, rA1, rB2
2005
madd.d rC22, rC22, rA2, rB2
2006
madd.d rC32, rC32, rA3, rB2
2007
madd.d rC03, rC03, rA0, rB3
2008
madd.d rC13, rC13, rA1, rB3
2009
madd.d rC23, rC23, rA2, rB3
2010
madd.d rC33, rC33, rA3, rB3
2012
madd.d rC00, rC00, ra0, rb0
2014
madd.d rC10, rC10, ra1, rb0
2016
madd.d rC20, rC20, ra2, rb0
2018
madd.d rC30, rC30, ra3, rb0
2020
madd.d rC01, rC01, ra0, rb1
2022
madd.d rC11, rC11, ra1, rb1
2024
madd.d rC21, rC21, ra2, rb1
2026
madd.d rC31, rC31, ra3, rb1
2027
madd.d rC02, rC02, ra0, rb2
2028
madd.d rC12, rC12, ra1, rb2
2029
madd.d rC22, rC22, ra2, rb2
2030
madd.d rC32, rC32, ra3, rb2
2031
madd.d rC03, rC03, ra0, rb3
2032
madd.d rC13, rC13, ra1, rb3
2033
madd.d rC23, rC23, ra2, rb3
2034
madd.d rC33, rC33, ra3, rb3
2038
madd.d rC00, rC00, rA0, rB0
2040
madd.d rC10, rC10, rA1, rB0
2042
madd.d rC20, rC20, rA2, rB0
2044
madd.d rC30, rC30, rA3, rB0
2046
madd.d rC01, rC01, rA0, rB1
2048
madd.d rC11, rC11, rA1, rB1
2050
madd.d rC21, rC21, rA2, rB1
2052
madd.d rC31, rC31, rA3, rB1
2053
madd.d rC02, rC02, rA0, rB2
2054
madd.d rC12, rC12, rA1, rB2
2055
madd.d rC22, rC22, rA2, rB2
2056
madd.d rC32, rC32, rA3, rB2
2057
madd.d rC03, rC03, rA0, rB3
2058
madd.d rC13, rC13, rA1, rB3
2059
madd.d rC23, rC23, rA2, rB3
2060
madd.d rC33, rC33, rA3, rB3
2062
madd.d rC00, rC00, ra0, rb0
2064
madd.d rC10, rC10, ra1, rb0
2066
madd.d rC20, rC20, ra2, rb0
2068
madd.d rC30, rC30, ra3, rb0
2070
madd.d rC01, rC01, ra0, rb1
2072
madd.d rC11, rC11, ra1, rb1
2074
madd.d rC21, rC21, ra2, rb1
2076
madd.d rC31, rC31, ra3, rb1
2077
madd.d rC02, rC02, ra0, rb2
2078
madd.d rC12, rC12, ra1, rb2
2079
madd.d rC22, rC22, ra2, rb2
2080
madd.d rC32, rC32, ra3, rb2
2081
madd.d rC03, rC03, ra0, rb3
2082
madd.d rC13, rC13, ra1, rb3
2083
madd.d rC23, rC23, ra2, rb3
2084
madd.d rC33, rC33, ra3, rb3
2088
madd.d rC00, rC00, rA0, rB0
2090
madd.d rC10, rC10, rA1, rB0
2092
madd.d rC20, rC20, rA2, rB0
2094
madd.d rC30, rC30, rA3, rB0
2096
madd.d rC01, rC01, rA0, rB1
2098
madd.d rC11, rC11, rA1, rB1
2100
madd.d rC21, rC21, rA2, rB1
2102
madd.d rC31, rC31, rA3, rB1
2103
madd.d rC02, rC02, rA0, rB2
2104
madd.d rC12, rC12, rA1, rB2
2105
madd.d rC22, rC22, rA2, rB2
2106
madd.d rC32, rC32, rA3, rB2
2107
madd.d rC03, rC03, rA0, rB3
2108
madd.d rC13, rC13, rA1, rB3
2109
madd.d rC23, rC23, rA2, rB3
2110
madd.d rC33, rC33, rA3, rB3
2112
madd.d rC00, rC00, ra0, rb0
2114
madd.d rC10, rC10, ra1, rb0
2116
madd.d rC20, rC20, ra2, rb0
2118
madd.d rC30, rC30, ra3, rb0
2120
madd.d rC01, rC01, ra0, rb1
2122
madd.d rC11, rC11, ra1, rb1
2124
madd.d rC21, rC21, ra2, rb1
2126
madd.d rC31, rC31, ra3, rb1
2127
madd.d rC02, rC02, ra0, rb2
2128
madd.d rC12, rC12, ra1, rb2
2129
madd.d rC22, rC22, ra2, rb2
2130
madd.d rC32, rC32, ra3, rb2
2131
madd.d rC03, rC03, ra0, rb3
2132
madd.d rC13, rC13, ra1, rb3
2133
madd.d rC23, rC23, ra2, rb3
2134
madd.d rC33, rC33, ra3, rb3
2138
madd.d rC00, rC00, rA0, rB0
2140
madd.d rC10, rC10, rA1, rB0
2142
madd.d rC20, rC20, rA2, rB0
2144
madd.d rC30, rC30, rA3, rB0
2146
madd.d rC01, rC01, rA0, rB1
2148
madd.d rC11, rC11, rA1, rB1
2150
madd.d rC21, rC21, rA2, rB1
2152
madd.d rC31, rC31, rA3, rB1
2153
madd.d rC02, rC02, rA0, rB2
2154
madd.d rC12, rC12, rA1, rB2
2155
madd.d rC22, rC22, rA2, rB2
2156
madd.d rC32, rC32, rA3, rB2
2157
madd.d rC03, rC03, rA0, rB3
2158
madd.d rC13, rC13, rA1, rB3
2159
madd.d rC23, rC23, rA2, rB3
2160
madd.d rC33, rC33, rA3, rB3
2162
madd.d rC00, rC00, ra0, rb0
2164
madd.d rC10, rC10, ra1, rb0
2166
madd.d rC20, rC20, ra2, rb0
2168
madd.d rC30, rC30, ra3, rb0
2170
madd.d rC01, rC01, ra0, rb1
2172
madd.d rC11, rC11, ra1, rb1
2174
madd.d rC21, rC21, ra2, rb1
2176
madd.d rC31, rC31, ra3, rb1
2177
madd.d rC02, rC02, ra0, rb2
2178
madd.d rC12, rC12, ra1, rb2
2179
madd.d rC22, rC22, ra2, rb2
2180
madd.d rC32, rC32, ra3, rb2
2181
madd.d rC03, rC03, ra0, rb3
2182
madd.d rC13, rC13, ra1, rb3
2183
madd.d rC23, rC23, ra2, rb3
2184
madd.d rC33, rC33, ra3, rb3
2188
madd.d rC00, rC00, rA0, rB0
2190
madd.d rC10, rC10, rA1, rB0
2192
madd.d rC20, rC20, rA2, rB0
2194
madd.d rC30, rC30, rA3, rB0
2196
madd.d rC01, rC01, rA0, rB1
2198
madd.d rC11, rC11, rA1, rB1
2200
madd.d rC21, rC21, rA2, rB1
2202
madd.d rC31, rC31, rA3, rB1
2203
madd.d rC02, rC02, rA0, rB2
2204
madd.d rC12, rC12, rA1, rB2
2205
madd.d rC22, rC22, rA2, rB2
2206
madd.d rC32, rC32, rA3, rB2
2207
madd.d rC03, rC03, rA0, rB3
2208
madd.d rC13, rC13, rA1, rB3
2209
madd.d rC23, rC23, rA2, rB3
2210
madd.d rC33, rC33, rA3, rB3
2212
madd.d rC00, rC00, ra0, rb0
2214
madd.d rC10, rC10, ra1, rb0
2216
madd.d rC20, rC20, ra2, rb0
2218
madd.d rC30, rC30, ra3, rb0
2220
madd.d rC01, rC01, ra0, rb1
2222
madd.d rC11, rC11, ra1, rb1
2224
madd.d rC21, rC21, ra2, rb1
2226
madd.d rC31, rC31, ra3, rb1
2227
madd.d rC02, rC02, ra0, rb2
2228
madd.d rC12, rC12, ra1, rb2
2229
madd.d rC22, rC22, ra2, rb2
2230
madd.d rC32, rC32, ra3, rb2
2231
madd.d rC03, rC03, ra0, rb3
2232
madd.d rC13, rC13, ra1, rb3
2233
madd.d rC23, rC23, ra2, rb3
2234
madd.d rC33, rC33, ra3, rb3
2238
madd.d rC00, rC00, rA0, rB0
2240
madd.d rC10, rC10, rA1, rB0
2242
madd.d rC20, rC20, rA2, rB0
2244
madd.d rC30, rC30, rA3, rB0
2246
madd.d rC01, rC01, rA0, rB1
2248
madd.d rC11, rC11, rA1, rB1
2250
madd.d rC21, rC21, rA2, rB1
2252
madd.d rC31, rC31, rA3, rB1
2253
madd.d rC02, rC02, rA0, rB2
2254
madd.d rC12, rC12, rA1, rB2
2255
madd.d rC22, rC22, rA2, rB2
2256
madd.d rC32, rC32, rA3, rB2
2257
madd.d rC03, rC03, rA0, rB3
2258
madd.d rC13, rC13, rA1, rB3
2259
madd.d rC23, rC23, rA2, rB3
2260
madd.d rC33, rC33, rA3, rB3
2262
madd.d rC00, rC00, ra0, rb0
2264
madd.d rC10, rC10, ra1, rb0
2266
madd.d rC20, rC20, ra2, rb0
2268
madd.d rC30, rC30, ra3, rb0
2270
madd.d rC01, rC01, ra0, rb1
2272
madd.d rC11, rC11, ra1, rb1
2274
madd.d rC21, rC21, ra2, rb1
2276
madd.d rC31, rC31, ra3, rb1
2277
madd.d rC02, rC02, ra0, rb2
2278
madd.d rC12, rC12, ra1, rb2
2279
madd.d rC22, rC22, ra2, rb2
2280
madd.d rC32, rC32, ra3, rb2
2281
madd.d rC03, rC03, ra0, rb3
2282
madd.d rC13, rC13, ra1, rb3
2283
madd.d rC23, rC23, ra2, rb3
2284
madd.d rC33, rC33, ra3, rb3
2288
madd.d rC00, rC00, rA0, rB0
2290
madd.d rC10, rC10, rA1, rB0
2292
madd.d rC20, rC20, rA2, rB0
2294
madd.d rC30, rC30, rA3, rB0
2296
madd.d rC01, rC01, rA0, rB1
2298
madd.d rC11, rC11, rA1, rB1
2300
madd.d rC21, rC21, rA2, rB1
2302
madd.d rC31, rC31, rA3, rB1
2303
madd.d rC02, rC02, rA0, rB2
2304
madd.d rC12, rC12, rA1, rB2
2305
madd.d rC22, rC22, rA2, rB2
2306
madd.d rC32, rC32, rA3, rB2
2307
madd.d rC03, rC03, rA0, rB3
2308
madd.d rC13, rC13, rA1, rB3
2309
madd.d rC23, rC23, rA2, rB3
2310
madd.d rC33, rC33, rA3, rB3
2312
madd.d rC00, rC00, ra0, rb0
2314
madd.d rC10, rC10, ra1, rb0
2316
madd.d rC20, rC20, ra2, rb0
2318
madd.d rC30, rC30, ra3, rb0
2320
madd.d rC01, rC01, ra0, rb1
2322
madd.d rC11, rC11, ra1, rb1
2324
madd.d rC21, rC21, ra2, rb1
2326
madd.d rC31, rC31, ra3, rb1
2327
madd.d rC02, rC02, ra0, rb2
2328
madd.d rC12, rC12, ra1, rb2
2329
madd.d rC22, rC22, ra2, rb2
2330
madd.d rC32, rC32, ra3, rb2
2331
madd.d rC03, rC03, ra0, rb3
2332
madd.d rC13, rC13, ra1, rb3
2333
madd.d rC23, rC23, ra2, rb3
2334
madd.d rC33, rC33, ra3, rb3
2338
madd.d rC00, rC00, rA0, rB0
2340
madd.d rC10, rC10, rA1, rB0
2342
madd.d rC20, rC20, rA2, rB0
2344
madd.d rC30, rC30, rA3, rB0
2346
madd.d rC01, rC01, rA0, rB1
2348
madd.d rC11, rC11, rA1, rB1
2350
madd.d rC21, rC21, rA2, rB1
2352
madd.d rC31, rC31, rA3, rB1
2353
madd.d rC02, rC02, rA0, rB2
2354
madd.d rC12, rC12, rA1, rB2
2355
madd.d rC22, rC22, rA2, rB2
2356
madd.d rC32, rC32, rA3, rB2
2357
madd.d rC03, rC03, rA0, rB3
2358
madd.d rC13, rC13, rA1, rB3
2359
madd.d rC23, rC23, rA2, rB3
2360
madd.d rC33, rC33, rA3, rB3
2362
madd.d rC00, rC00, ra0, rb0
2364
madd.d rC10, rC10, ra1, rb0
2366
madd.d rC20, rC20, ra2, rb0
2368
madd.d rC30, rC30, ra3, rb0
2370
madd.d rC01, rC01, ra0, rb1
2372
madd.d rC11, rC11, ra1, rb1
2374
madd.d rC21, rC21, ra2, rb1
2376
madd.d rC31, rC31, ra3, rb1
2377
madd.d rC02, rC02, ra0, rb2
2378
madd.d rC12, rC12, ra1, rb2
2379
madd.d rC22, rC22, ra2, rb2
2380
madd.d rC32, rC32, ra3, rb2
2381
madd.d rC03, rC03, ra0, rb3
2382
madd.d rC13, rC13, ra1, rb3
2383
madd.d rC23, rC23, ra2, rb3
2384
madd.d rC33, rC33, ra3, rb3
2388
madd.d rC00, rC00, rA0, rB0
2390
madd.d rC10, rC10, rA1, rB0
2392
madd.d rC20, rC20, rA2, rB0
2394
madd.d rC30, rC30, rA3, rB0
2396
madd.d rC01, rC01, rA0, rB1
2398
madd.d rC11, rC11, rA1, rB1
2400
madd.d rC21, rC21, rA2, rB1
2402
madd.d rC31, rC31, rA3, rB1
2403
madd.d rC02, rC02, rA0, rB2
2404
madd.d rC12, rC12, rA1, rB2
2405
madd.d rC22, rC22, rA2, rB2
2406
madd.d rC32, rC32, rA3, rB2
2407
madd.d rC03, rC03, rA0, rB3
2408
madd.d rC13, rC13, rA1, rB3
2409
madd.d rC23, rC23, rA2, rB3
2410
madd.d rC33, rC33, rA3, rB3
2412
madd.d rC00, rC00, ra0, rb0
2414
madd.d rC10, rC10, ra1, rb0
2416
madd.d rC20, rC20, ra2, rb0
2418
madd.d rC30, rC30, ra3, rb0
2420
madd.d rC01, rC01, ra0, rb1
2422
madd.d rC11, rC11, ra1, rb1
2424
madd.d rC21, rC21, ra2, rb1
2426
madd.d rC31, rC31, ra3, rb1
2427
madd.d rC02, rC02, ra0, rb2
2428
madd.d rC12, rC12, ra1, rb2
2429
madd.d rC22, rC22, ra2, rb2
2430
madd.d rC32, rC32, ra3, rb2
2431
madd.d rC03, rC03, ra0, rb3
2432
madd.d rC13, rC13, ra1, rb3
2433
madd.d rC23, rC23, ra2, rb3
2434
madd.d rC33, rC33, ra3, rb3
2438
madd.d rC00, rC00, rA0, rB0
2440
madd.d rC10, rC10, rA1, rB0
2442
madd.d rC20, rC20, rA2, rB0
2444
madd.d rC30, rC30, rA3, rB0
2446
madd.d rC01, rC01, rA0, rB1
2448
madd.d rC11, rC11, rA1, rB1
2450
madd.d rC21, rC21, rA2, rB1
2452
madd.d rC31, rC31, rA3, rB1
2453
madd.d rC02, rC02, rA0, rB2
2454
madd.d rC12, rC12, rA1, rB2
2455
madd.d rC22, rC22, rA2, rB2
2456
madd.d rC32, rC32, rA3, rB2
2457
madd.d rC03, rC03, rA0, rB3
2458
madd.d rC13, rC13, rA1, rB3
2459
madd.d rC23, rC23, rA2, rB3
2460
madd.d rC33, rC33, rA3, rB3
2462
madd.d rC00, rC00, ra0, rb0
2464
madd.d rC10, rC10, ra1, rb0
2466
madd.d rC20, rC20, ra2, rb0
2468
madd.d rC30, rC30, ra3, rb0
2470
madd.d rC01, rC01, ra0, rb1
2472
madd.d rC11, rC11, ra1, rb1
2474
madd.d rC21, rC21, ra2, rb1
2476
madd.d rC31, rC31, ra3, rb1
2477
madd.d rC02, rC02, ra0, rb2
2478
madd.d rC12, rC12, ra1, rb2
2479
madd.d rC22, rC22, ra2, rb2
2480
madd.d rC32, rC32, ra3, rb2
2481
madd.d rC03, rC03, ra0, rb3
2482
madd.d rC13, rC13, ra1, rb3
2483
madd.d rC23, rC23, ra2, rb3
2484
madd.d rC33, rC33, ra3, rb3
2488
madd.d rC33, rC33, ra3, rb3 // in delay slot!
2494
/*
 * Tail of one MLOOP pass over a 4x4 block of C accumulators (rC00..rC33).
 *
 * First group: the madd.d instructions consume the values already held in
 * rA0-rA3 / rB0-rB3, while the interleaved ldc1 instructions fill
 * ra0-ra3 / rb0-rb3 from byte offset KB*8-8 of each A and B pointer
 * (the last 8-byte slot of a KB*8-byte span).
 */
ldc1 rb0, KB*8-8(pB0)
2495
madd.d rC00, rC00, rA0, rB0
2496
ldc1 ra0, KB*8-8(pA0)
2497
madd.d rC10, rC10, rA1, rB0
2498
ldc1 ra1, KB*8-8(pA1)
2499
madd.d rC20, rC20, rA2, rB0
2500
ldc1 ra2, KB*8-8(pA2)
2501
madd.d rC30, rC30, rA3, rB0
2502
ldc1 ra3, KB*8-8(pA3)
2503
madd.d rC01, rC01, rA0, rB1
2504
ldc1 rb1, KB*8-8(pB1)
2505
madd.d rC11, rC11, rA1, rB1
2506
ldc1 rb2, KB*8-8(pB2)
2507
madd.d rC21, rC21, rA2, rB1
2508
ldc1 rb3, KB*8-8(pB3)
2509
madd.d rC31, rC31, rA3, rB1
2510
/*
 * All loads for this pass have been issued, so the A pointers can now be
 * advanced by incAm and the C pointers by CMUL(32) bytes; these integer
 * updates are interleaved with the remaining madd.d instructions.
 */
daddu pA0, pA0, incAm
2511
madd.d rC02, rC02, rA0, rB2
2512
daddu pA1, pA1, incAm
2513
madd.d rC12, rC12, rA1, rB2
2514
daddu pA2, pA2, incAm
2515
madd.d rC22, rC22, rA2, rB2
2516
daddu pA3, pA3, incAm
2517
madd.d rC32, rC32, rA3, rB2
2518
daddiu pC0, pC0, CMUL(32)
2519
madd.d rC03, rC03, rA0, rB3
2520
daddiu pC1, pC1, CMUL(32)
2521
madd.d rC13, rC13, rA1, rB3
2522
daddiu pC2, pC2, CMUL(32)
2523
madd.d rC23, rC23, rA2, rB3
2524
daddiu pC3, pC3, CMUL(32)
2525
madd.d rC33, rC33, rA3, rB3
2527
/*
 * Second group: accumulate the ra / rb values loaded above.  Each sdc1 is
 * placed after the last madd.d that writes the register it stores.  The C
 * pointers were already advanced, so the stores use negative offsets
 * -CMUL(32) .. -CMUL(8); consecutive accumulators of one pC pointer are
 * CMUL(8) bytes apart.
 * NOTE(review): the CMUL doubling presumably reflects an interleaved
 * complex C layout -- confirm against the CMUL definition and callers.
 */
madd.d rC00, rC00, ra0, rb0
2528
madd.d rC10, rC10, ra1, rb0
2529
madd.d rC20, rC20, ra2, rb0
2530
madd.d rC30, rC30, ra3, rb0
2531
madd.d rC01, rC01, ra0, rb1
2532
sdc1 rC00, -CMUL(32)(pC0)
2533
madd.d rC11, rC11, ra1, rb1
2534
sdc1 rC10, -CMUL(24)(pC0)
2535
madd.d rC21, rC21, ra2, rb1
2536
sdc1 rC20, -CMUL(16)(pC0)
2537
madd.d rC31, rC31, ra3, rb1
2538
sdc1 rC30, -CMUL(8)(pC0)
2539
madd.d rC02, rC02, ra0, rb2
2540
sdc1 rC01, -CMUL(32)(pC1)
2541
madd.d rC12, rC12, ra1, rb2
2542
sdc1 rC11, -CMUL(24)(pC1)
2543
madd.d rC22, rC22, ra2, rb2
2544
sdc1 rC21, -CMUL(16)(pC1)
2545
madd.d rC32, rC32, ra3, rb2
2546
sdc1 rC31, -CMUL(8)(pC1)
2547
madd.d rC03, rC03, ra0, rb3
2548
sdc1 rC02, -CMUL(32)(pC2)
2549
madd.d rC13, rC13, ra1, rb3
2550
sdc1 rC12, -CMUL(24)(pC2)
2551
madd.d rC23, rC23, ra2, rb3
2552
sdc1 rC22, -CMUL(16)(pC2)
2553
madd.d rC33, rC33, ra3, rb3
2554
sdc1 rC32, -CMUL(8)(pC2)
2555
sdc1 rC03, -CMUL(32)(pC3)
2556
sdc1 rC13, -CMUL(24)(pC3)
2557
sdc1 rC23, -CMUL(16)(pC3)
2558
/*
 * Repeat MLOOP until pA0 reaches stAm.  The final store of rC33 follows the
 * branch; assuming noreorder mode (as the "delay slot" notes at the file's
 * other branches suggest) it executes in the delay slot whether or not the
 * branch is taken.
 */
bne pA0, stAm, MLOOP
2559
sdc1 rC33, -CMUL(8)(pC3)
2561
/*
 * End of one NLOOP pass (reached when the MLOOP branch falls through).
 * The four A pointers are moved back by incAn, the four C pointers forward
 * by incCn, and the four B pointers forward by incBn.
 * NOTE(review): incAn presumably rewinds A to its starting position for the
 * next group of B/C columns -- confirm where incAn is computed.
 */
dsubu pA0, pA0, incAn
2562
dsubu pA1, pA1, incAn
2563
dsubu pA2, pA2, incAn
2564
dsubu pA3, pA3, incAn
2565
daddu pC0, pC0, incCn
2566
daddu pC1, pC1, incCn
2567
daddu pC2, pC2, incCn
2568
daddu pC3, pC3, incCn
2569
daddu pB0, pB0, incBn
2570
daddu pB1, pB1, incBn
2571
daddu pB2, pB2, incBn
2572
/*
 * Loop back to NLOOP until pB0 reaches stBn.  pB0 is updated before the
 * compare; the pB3 update is placed in the branch delay slot.
 */
bne pB0, stBn, NLOOP
2573
daddu pB3, pB3, incBn /* delay slot! */
2576
* Epilogue: restore registers and return
2587
#ifdef ATL_USE64BITS
2605
daddiu $sp, $sp, FSIZE /* delay slot of return statement */
2607
/* end of file MIPS assembler BS */
2612
.size ATL_USERMM,.-ATL_USERMM