2
* Automatically Tuned Linear Algebra Software v3.8.4
2
* Automatically Tuned Linear Algebra Software v3.10.1
3
3
* (C) Copyright 1999 R. Clint Whaley
5
5
* Redistribution and use in source and binary forms, with or without
169
169
int Mjoin(PATL,NCmmIJK)
170
170
(const enum ATLAS_TRANS TA, const enum ATLAS_TRANS TB,
171
171
const int M, const int N, const int K, const SCALAR alpha,
172
const TYPE *A, const int lda, const TYPE *B, const int ldb,
173
const SCALAR beta, TYPE *C, const int ldc)
172
const TYPE *A, const int lda0, const TYPE *B, const int ldb0,
173
const SCALAR beta, TYPE *C, const int ldc0)
175
175
* IJK loop-ordered matmul with no matrix copy
178
size_t incAk, incAm, incAn, incBk, incBm, incBn;
179
const size_t lda=lda0, ldb=ldb0, ldc=ldc0;
178
180
const int Mb = M / MB, Nb = N / NB, Kb = K / KB;
179
181
const int mr = M - Mb*MB, nr = N - Nb*NB, kr = K - Kb*KB;
180
int incAk, incAm, incAn, incBk, incBm, incBn;
181
const int incCn = ldc*NB, incCm = MB - Nb * incCn;
182
const size_t incCn = ldc*NB, incCm = MB - Nb * incCn;
182
183
const int BetaIsZero = (beta == ATL_rzero);
184
185
const TYPE *a=A, *b=B;