static int spmv_kernel(blas_arg_t *args, BLASLONG *range_m, BLASLONG *range_n, FLOAT *dummy1, FLOAT *buffer, BLASLONG pos){
FLOAT *a, *x, *y;
- BLASLONG incx, incy;
+ BLASLONG incx;
BLASLONG m_from, m_to, i;
#ifndef COMPLEX
FLOAT result;
y = (FLOAT *)args -> c;
incx = args -> ldb;
- incy = args -> ldc;
m_from = 0;
m_to = args -> m;
static int syr_kernel(blas_arg_t *args, BLASLONG *range_m, BLASLONG *range_n, FLOAT *dummy1, FLOAT *buffer, BLASLONG pos){
FLOAT *a, *x, *y;
- BLASLONG lda, incx, incy;
+ BLASLONG incx, incy;
BLASLONG i, m_from, m_to;
FLOAT alpha_r;
#ifdef COMPLEX
incx = args -> lda;
incy = args -> ldb;
- lda = args -> ldc;
alpha_r = *((FLOAT *)args -> alpha + 0);
#ifdef COMPLEX
BLASLONG incx;
BLASLONG i, m_from, m_to;
FLOAT alpha_r;
-#if defined(COMPLEX) && !defined(HER) && !defined(HERREV)
+#if defined(COMPLEX) && !defined(HEMV) && !defined(HEMVREV)
FLOAT alpha_i;
#endif
incx = args -> lda;
alpha_r = *((FLOAT *)args -> alpha + 0);
-#if defined(COMPLEX) && !defined(HER) && !defined(HERREV)
+#if defined(COMPLEX) && !defined(HEMV) && !defined(HEMVREV)
alpha_i = *((FLOAT *)args -> alpha + 1);
#endif
static int symv_kernel(blas_arg_t *args, BLASLONG *range_m, BLASLONG *range_n, FLOAT *dummy1, FLOAT *buffer, BLASLONG pos){
FLOAT *a, *x, *y;
- BLASLONG lda, incx, incy;
+ BLASLONG lda, incx;
BLASLONG m_from, m_to;
a = (FLOAT *)args -> a;
lda = args -> lda;
incx = args -> ldb;
- incy = args -> ldc;
m_from = 0;
m_to = args -> m;
int CNAME(BLASLONG n, BLASLONG k, FLOAT *a, BLASLONG lda, FLOAT *b, BLASLONG incb, void *buffer){
BLASLONG i;
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
BLASLONG length;
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + n * sizeof(FLOAT) + 4095) & ~4095);
COPY_K(n, b, incb, buffer, 1);
}
int CNAME(BLASLONG n, BLASLONG k, FLOAT *a, BLASLONG lda, FLOAT *b, BLASLONG incb, void *buffer){
BLASLONG i;
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
BLASLONG length;
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + n * sizeof(FLOAT) + 4095) & ~4095);
COPY_K(n, b, incb, buffer, 1);
}
int CNAME(BLASLONG n, BLASLONG k, FLOAT *a, BLASLONG lda, FLOAT *b, BLASLONG incb, void *buffer){
BLASLONG i;
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
BLASLONG length;
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + n * sizeof(FLOAT) + 4095) & ~4095);
COPY_K(n, b, incb, buffer, 1);
}
int CNAME(BLASLONG n, BLASLONG k, FLOAT *a, BLASLONG lda, FLOAT *b, BLASLONG incb, void *buffer){
BLASLONG i;
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
BLASLONG length;
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + n * sizeof(FLOAT) + 4095) & ~4095);
COPY_K(n, b, incb, buffer, 1);
}
int CNAME(BLASLONG m, FLOAT *a, FLOAT *b, BLASLONG incb, void *buffer){
BLASLONG i;
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + m * sizeof(FLOAT) + 4095) & ~4095);
COPY_K(m, b, incb, buffer, 1);
}
int CNAME(BLASLONG m, FLOAT *a, FLOAT *b, BLASLONG incb, void *buffer){
BLASLONG i;
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + m * sizeof(FLOAT) + 4095) & ~4095);
COPY_K(m, b, incb, buffer, 1);
}
int CNAME(BLASLONG n, BLASLONG k, FLOAT *a, BLASLONG lda, FLOAT *b, BLASLONG incb, void *buffer){
BLASLONG i;
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
BLASLONG length;
#if (TRANSA == 2) || (TRANSA == 4)
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + n * sizeof(FLOAT) * COMPSIZE+ 4095) & ~4095);
COPY_K(n, b, incb, buffer, 1);
}
int CNAME(BLASLONG n, BLASLONG k, FLOAT *a, BLASLONG lda, FLOAT *b, BLASLONG incb, void *buffer){
BLASLONG i;
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
BLASLONG length;
#if (TRANSA == 2) || (TRANSA == 4)
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + n * sizeof(FLOAT) * COMPSIZE + 4095) & ~4095);
COPY_K(n, b, incb, buffer, 1);
}
int CNAME(BLASLONG n, BLASLONG k, FLOAT *a, BLASLONG lda, FLOAT *b, BLASLONG incb, void *buffer){
BLASLONG i;
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
BLASLONG length;
#if (TRANSA == 2) || (TRANSA == 4)
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + n * sizeof(FLOAT) * COMPSIZE + 4095) & ~4095);
COPY_K(n, b, incb, buffer, 1);
}
int CNAME(BLASLONG n, BLASLONG k, FLOAT *a, BLASLONG lda, FLOAT *b, BLASLONG incb, void *buffer){
BLASLONG i;
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
BLASLONG length;
#if (TRANSA == 2) || (TRANSA == 4)
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + n * sizeof(FLOAT) * COMPSIZE+ 4095) & ~4095);
COPY_K(n, b, incb, buffer, 1);
}
#ifndef UNIT
FLOAT atemp1, atemp2, btemp1, btemp2;
#endif
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + m * sizeof(FLOAT) * 2 + 4095) & ~4095);
COPY_K(m, b, incb, buffer, 1);
}
#ifndef UNIT
FLOAT atemp1, atemp2, btemp1, btemp2;
#endif
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + m * sizeof(FLOAT) * 2 + 4095) & ~4095);
COPY_K(m, b, incb, buffer, 1);
}
#ifndef UNIT
FLOAT ar, ai, br, bi, ratio, den;
#endif
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + m * sizeof(FLOAT) * 2 + 4095) & ~4095);
COPY_K(m, b, incb, buffer, 1);
}
#ifndef UNIT
FLOAT ar, ai, br, bi, ratio, den;
#endif
- FLOAT *gemvbuffer = (FLOAT *)buffer;
FLOAT *B = b;
if (incb != 1) {
B = buffer;
- gemvbuffer = (FLOAT *)(((BLASLONG)buffer + m * sizeof(FLOAT) * 2 + 4095) & ~4095);
COPY_K(m, b, incb, buffer, 1);
}
blas_queue_t queue[MAX_CPU_NUMBER];
BLASLONG range_M[MAX_CPU_NUMBER + 1], range_N[MAX_CPU_NUMBER + 1];
- BLASLONG procs, total_procs, num_cpu_m, num_cpu_n;
+ BLASLONG procs, num_cpu_m, num_cpu_n;
BLASLONG width, i, j;
BLASLONG divM, divN;
BLASLONG is, min_i, div_n;
BLASLONG i, current;
- BLASLONG l1stride, l2size;
+ BLASLONG l1stride;
#ifdef TIMING
BLASULONG rpcc_counter;
#endif
) return 0;
- l2size = GEMM_P * GEMM_Q;
-
#if 0
fprintf(stderr, "Thread[%ld] m_from : %ld m_to : %ld n_from : %ld n_to : %ld N_from : %ld N_to : %ld\n",
mypos, m_from, m_to, n_from, n_to, N_from, N_to);
n = n_to - n_from;
}
- if ((args -> m < nthreads * SWITCH_RATIO) || (args -> n < nthreads * SWITCH_RATIO)) {
+ if ((m < nthreads * SWITCH_RATIO) || (n < nthreads * SWITCH_RATIO)) {
GEMM_LOCAL(args, range_m, range_n, sa, sb, 0);
return 0;
}
} memory[NUM_BUFFERS];
static int memory_initialized = 0;
-static void gotoblas_memory_init(void);
/* Memory allocation routine */
/* procpos ... indicates where it comes from */