2
* Automatically Tuned Linear Algebra Software v3.8.4
2
* Automatically Tuned Linear Algebra Software v3.10.1
3
3
* (C) Copyright 1999 R. Clint Whaley
5
5
* Redistribution and use in source and binary forms, with or without
197
197
int Mjoin(PATL,NCmmJIK_c)
198
198
(const enum ATLAS_TRANS TA, const enum ATLAS_TRANS TB,
199
199
const int M, const int N, const int K, const SCALAR alpha,
200
const TYPE *A, const int lda, const TYPE *B, const int ldb,
201
const SCALAR beta, TYPE *C, const int ldc)
200
const TYPE *A, const int lda0, const TYPE *B, const int ldb0,
201
const SCALAR beta, TYPE *C, const int ldc0)
203
203
* JIK loop-ordered matmul with no matrix copy
206
const size_t lda=lda0, ldb=ldb0, ldc=ldc0;
207
size_t incAk, incAm, incAn, incBk, incBm, incBn;
206
208
const int Mb = M / MB, Nb = N / NB, Kb = K / KB;
207
209
const int mr = M - Mb*MB, nr = N - Nb*NB, kr = K - Kb*KB;
208
int incAk, incAm, incAn, incBk, incBm, incBn;
209
const int incCm = (MB<<1), incCn = (ldc*NB - M + mr)<<1;
210
const size_t incCm = (MB<<1), incCn = (ldc*NB - M + mr)<<1;
211
212
const TYPE *a=A, *b=B;
212
213
const TYPE ralpha = *alpha, rbeta = *beta;