/*size_t i; size_t j; size_t max_dim = lda*lda; if (coreid==0){ for (i=0; i