/*
Genome-wide Efficient Mixed Model Association (GEMMA)
Copyright (C) 2011-2017, Xiang Zhou
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program. If not, see .
*/
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include "gsl/gsl_blas.h"
#include "gsl/gsl_cdf.h"
#include "gsl/gsl_linalg.h"
#include "gsl/gsl_matrix.h"
#include "gsl/gsl_min.h"
#include "gsl/gsl_roots.h"
#include "gsl/gsl_vector.h"
#include "fastblas.h"
#include "gzstream.h"
#include "gemma_io.h"
#include "lapack.h"
#include "mathfunc.h"
#include "lmm.h"
#include "mvlmm.h"
using namespace std;
// In this file, X, Y are already transformed (i.e. UtX and UtY).
void MVLMM::CopyFromParam(PARAM &cPar) {
a_mode = cPar.a_mode;
d_pace = cPar.d_pace;
file_bfile = cPar.file_bfile;
file_geno = cPar.file_geno;
file_out = cPar.file_out;
path_out = cPar.path_out;
l_min = cPar.l_min;
l_max = cPar.l_max;
n_region = cPar.n_region;
p_nr = cPar.p_nr;
em_iter = cPar.em_iter;
nr_iter = cPar.nr_iter;
em_prec = cPar.em_prec;
nr_prec = cPar.nr_prec;
crt = cPar.crt;
Vg_remle_null = cPar.Vg_remle_null;
Ve_remle_null = cPar.Ve_remle_null;
Vg_mle_null = cPar.Vg_mle_null;
Ve_mle_null = cPar.Ve_mle_null;
time_UtX = 0.0;
time_opt = 0.0;
ni_total = cPar.ni_total;
ns_total = cPar.ns_total;
ni_test = cPar.ni_test;
ns_test = cPar.ns_test;
n_cvt = cPar.n_cvt;
n_ph = cPar.n_ph;
indicator_idv = cPar.indicator_idv;
indicator_snp = cPar.indicator_snp;
snpInfo = cPar.snpInfo;
return;
}
void MVLMM::CopyToParam(PARAM &cPar) {
cPar.time_UtX = time_UtX;
cPar.time_opt = time_opt;
cPar.Vg_remle_null = Vg_remle_null;
cPar.Ve_remle_null = Ve_remle_null;
cPar.Vg_mle_null = Vg_mle_null;
cPar.Ve_mle_null = Ve_mle_null;
cPar.VVg_remle_null = VVg_remle_null;
cPar.VVe_remle_null = VVe_remle_null;
cPar.VVg_mle_null = VVg_mle_null;
cPar.VVe_mle_null = VVe_mle_null;
cPar.beta_remle_null = beta_remle_null;
cPar.se_beta_remle_null = se_beta_remle_null;
cPar.beta_mle_null = beta_mle_null;
cPar.se_beta_mle_null = se_beta_mle_null;
cPar.logl_remle_H0 = logl_remle_H0;
cPar.logl_mle_H0 = logl_mle_H0;
return;
}
void MVLMM::WriteFiles() {
string file_str;
file_str = path_out + "/" + file_out;
file_str += ".assoc.txt";
ofstream outfile(file_str.c_str(), ofstream::out);
if (!outfile) {
cout << "error writing file: " << file_str.c_str() << endl;
return;
}
outfile << "chr"
<< "\t"
<< "rs"
<< "\t"
<< "ps"
<< "\t"
<< "n_miss"
<< "\t"
<< "allele1"
<< "\t"
<< "allele0"
<< "\t"
<< "af"
<< "\t";
for (size_t i = 0; i < n_ph; i++) {
outfile << "beta_" << i + 1 << "\t";
}
for (size_t i = 0; i < n_ph; i++) {
for (size_t j = i; j < n_ph; j++) {
outfile << "Vbeta_" << i + 1 << "_" << j + 1 << "\t";
}
}
if (a_mode == 1) {
outfile << "p_wald" << endl;
} else if (a_mode == 2) {
outfile << "p_lrt" << endl;
} else if (a_mode == 3) {
outfile << "p_score" << endl;
} else if (a_mode == 4) {
outfile << "p_wald"
<< "\t"
<< "p_lrt"
<< "\t"
<< "p_score" << endl;
} else {
}
size_t t = 0, c = 0;
for (size_t i = 0; i < snpInfo.size(); ++i) {
if (indicator_snp[i] == 0) {
continue;
}
outfile << snpInfo[i].chr << "\t" << snpInfo[i].rs_number << "\t"
<< snpInfo[i].base_position << "\t" << snpInfo[i].n_miss << "\t"
<< snpInfo[i].a_minor << "\t" << snpInfo[i].a_major << "\t" << fixed
<< setprecision(3) << snpInfo[i].maf << "\t";
outfile << scientific << setprecision(6);
for (size_t i = 0; i < n_ph; i++) {
outfile << sumStat[t].v_beta[i] << "\t";
}
c = 0;
for (size_t i = 0; i < n_ph; i++) {
for (size_t j = i; j < n_ph; j++) {
outfile << sumStat[t].v_Vbeta[c] << "\t";
c++;
}
}
if (a_mode == 1) {
outfile << sumStat[t].p_wald << endl;
} else if (a_mode == 2) {
outfile << sumStat[t].p_lrt << endl;
} else if (a_mode == 3) {
outfile << sumStat[t].p_score << endl;
} else if (a_mode == 4) {
outfile << sumStat[t].p_wald << "\t" << sumStat[t].p_lrt << "\t"
<< sumStat[t].p_score << endl;
} else {
}
t++;
}
outfile.close();
outfile.clear();
return;
}
// Below are functions for EM algorithm.
double EigenProc(const gsl_matrix *V_g, const gsl_matrix *V_e, gsl_vector *D_l,
gsl_matrix *UltVeh, gsl_matrix *UltVehi) {
size_t d_size = V_g->size1;
double d, logdet_Ve = 0.0;
// Eigen decomposition of V_e.
gsl_matrix *Lambda = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *V_e_temp = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *V_e_h = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *V_e_hi = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *VgVehi = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *U_l = gsl_matrix_alloc(d_size, d_size);
gsl_matrix_memcpy(V_e_temp, V_e);
EigenDecomp(V_e_temp, U_l, D_l, 0);
// Calculate V_e_h and V_e_hi.
gsl_matrix_set_zero(V_e_h);
gsl_matrix_set_zero(V_e_hi);
for (size_t i = 0; i < d_size; i++) {
d = gsl_vector_get(D_l, i);
if (d <= 0) {
continue;
}
logdet_Ve += safe_log(d);
gsl_vector_view U_col = gsl_matrix_column(U_l, i);
d = safe_sqrt(d);
gsl_blas_dsyr(CblasUpper, d, &U_col.vector, V_e_h);
d = 1.0 / d;
gsl_blas_dsyr(CblasUpper, d, &U_col.vector, V_e_hi);
}
// Copy the upper part to lower part.
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j < i; j++) {
gsl_matrix_set(V_e_h, i, j, gsl_matrix_get(V_e_h, j, i));
gsl_matrix_set(V_e_hi, i, j, gsl_matrix_get(V_e_hi, j, i));
}
}
// Calculate Lambda=V_ehi V_g V_ehi.
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, V_g, V_e_hi, 0.0, VgVehi);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, V_e_hi, VgVehi, 0.0, Lambda);
// Eigen decomposition of Lambda.
EigenDecomp(Lambda, U_l, D_l, 0);
for (size_t i = 0; i < d_size; i++) {
d = gsl_vector_get(D_l, i);
if (d < 0) {
gsl_vector_set(D_l, i, 0);
}
}
// Calculate UltVeh and UltVehi.
gsl_blas_dgemm(CblasTrans, CblasNoTrans, 1.0, U_l, V_e_h, 0.0, UltVeh);
gsl_blas_dgemm(CblasTrans, CblasNoTrans, 1.0, U_l, V_e_hi, 0.0, UltVehi);
// free memory
gsl_matrix_free(Lambda);
gsl_matrix_free(V_e_temp);
gsl_matrix_free(V_e_h);
gsl_matrix_free(V_e_hi);
gsl_matrix_free(VgVehi);
gsl_matrix_free(U_l);
return logdet_Ve;
}
// Qi=(\sum_{k=1}^n x_kx_k^T\otimes(delta_k*Dl+I)^{-1} )^{-1}.
double CalcQi(const gsl_vector *eval, const gsl_vector *D_l,
const gsl_matrix *X, gsl_matrix *Qi) {
size_t n_size = eval->size, d_size = D_l->size, dc_size = Qi->size1;
size_t c_size = dc_size / d_size;
double delta, dl, d1, d2, d, logdet_Q;
gsl_matrix *Q = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix_set_zero(Q);
for (size_t i = 0; i < c_size; i++) {
for (size_t j = 0; j < c_size; j++) {
for (size_t l = 0; l < d_size; l++) {
dl = gsl_vector_get(D_l, l);
if (j < i) {
d = gsl_matrix_get(Q, j * d_size + l, i * d_size + l);
} else {
d = 0.0;
for (size_t k = 0; k < n_size; k++) {
d1 = gsl_matrix_get(X, i, k);
d2 = gsl_matrix_get(X, j, k);
delta = gsl_vector_get(eval, k);
d += d1 * d2 / (dl * delta + 1.0); // @@
}
}
gsl_matrix_set(Q, i * d_size + l, j * d_size + l, d);
}
}
}
// Calculate LU decomposition of Q, and invert Q and calculate |Q|.
int sig;
gsl_permutation *pmt = gsl_permutation_alloc(dc_size);
LUDecomp(Q, pmt, &sig);
LUInvert(Q, pmt, Qi);
logdet_Q = LULndet(Q);
gsl_matrix_free(Q);
gsl_permutation_free(pmt);
return logdet_Q;
}
// xHiy=\sum_{k=1}^n x_k\otimes ((delta_k*Dl+I)^{-1}Ul^TVe^{-1/2}y.
//
// FIXME: mvlmm spends a massive amount of time here
void CalcXHiY(const gsl_vector *eval, const gsl_vector *D_l,
const gsl_matrix *X, const gsl_matrix *UltVehiY,
gsl_vector *xHiy) {
// debug_msg("enter");
size_t n_size = eval->size, c_size = X->size1, d_size = D_l->size;
// gsl_vector_set_zero(xHiy);
double x, delta, dl, y, d;
for (size_t i = 0; i < d_size; i++) {
dl = gsl_vector_get(D_l, i);
for (size_t j = 0; j < c_size; j++) {
d = 0.0;
for (size_t k = 0; k < n_size; k++) {
x = gsl_matrix_get(X, j, k);
y = gsl_matrix_get(UltVehiY, i, k);
delta = gsl_vector_get(eval, k);
d += x * y / (delta * dl + 1.0);
}
gsl_vector_set(xHiy, j * d_size + i, d);
}
}
// debug_msg("exit");
return;
}
// OmegaU=D_l/(delta Dl+I)^{-1}
// OmegaE=delta D_l/(delta Dl+I)^{-1}
void CalcOmega(const gsl_vector *eval, const gsl_vector *D_l,
gsl_matrix *OmegaU, gsl_matrix *OmegaE) {
size_t n_size = eval->size, d_size = D_l->size;
double delta, dl, d_u, d_e;
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
for (size_t i = 0; i < d_size; i++) {
dl = gsl_vector_get(D_l, i);
d_u = dl / (delta * dl + 1.0); // @@
d_e = delta * d_u;
gsl_matrix_set(OmegaU, i, k, d_u);
gsl_matrix_set(OmegaE, i, k, d_e);
}
}
return;
}
void UpdateU(const gsl_matrix *OmegaE, const gsl_matrix *UltVehiY,
const gsl_matrix *UltVehiBX, gsl_matrix *UltVehiU) {
gsl_matrix_memcpy(UltVehiU, UltVehiY);
gsl_matrix_sub(UltVehiU, UltVehiBX);
gsl_matrix_mul_elements(UltVehiU, OmegaE);
return;
}
void UpdateE(const gsl_matrix *UltVehiY, const gsl_matrix *UltVehiBX,
const gsl_matrix *UltVehiU, gsl_matrix *UltVehiE) {
gsl_matrix_memcpy(UltVehiE, UltVehiY);
gsl_matrix_sub(UltVehiE, UltVehiBX);
gsl_matrix_sub(UltVehiE, UltVehiU);
return;
}
void UpdateL_B(const gsl_matrix *X, const gsl_matrix *XXti,
const gsl_matrix *UltVehiY, const gsl_matrix *UltVehiU,
gsl_matrix *UltVehiBX, gsl_matrix *UltVehiB) {
size_t c_size = X->size1, d_size = UltVehiY->size1;
gsl_matrix *YUX = gsl_matrix_alloc(d_size, c_size);
gsl_matrix_memcpy(UltVehiBX, UltVehiY);
gsl_matrix_sub(UltVehiBX, UltVehiU);
gsl_blas_dgemm(CblasNoTrans, CblasTrans, 1.0, UltVehiBX, X, 0.0, YUX);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, YUX, XXti, 0.0, UltVehiB);
gsl_matrix_free(YUX);
return;
}
void UpdateRL_B(const gsl_vector *xHiy, const gsl_matrix *Qi,
gsl_matrix *UltVehiB) {
size_t d_size = UltVehiB->size1, c_size = UltVehiB->size2,
dc_size = Qi->size1;
gsl_vector *b = gsl_vector_alloc(dc_size);
// Calculate b=Qiv.
gsl_blas_dgemv(CblasNoTrans, 1.0, Qi, xHiy, 0.0, b);
// Copy b to UltVehiB.
for (size_t i = 0; i < c_size; i++) {
gsl_vector_view UltVehiB_col = gsl_matrix_column(UltVehiB, i);
gsl_vector_const_view b_subcol =
gsl_vector_const_subvector(b, i * d_size, d_size);
gsl_vector_memcpy(&UltVehiB_col.vector, &b_subcol.vector);
}
gsl_vector_free(b);
return;
}
void UpdateV(const gsl_vector *eval, const gsl_matrix *U, const gsl_matrix *E,
const gsl_matrix *Sigma_uu, const gsl_matrix *Sigma_ee,
gsl_matrix *V_g, gsl_matrix *V_e) {
size_t n_size = eval->size, d_size = U->size1;
gsl_matrix_set_zero(V_g);
gsl_matrix_set_zero(V_e);
double delta;
// Calculate the first part: UD^{-1}U^T and EE^T.
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
if (delta == 0) {
continue;
}
gsl_vector_const_view U_col = gsl_matrix_const_column(U, k);
gsl_blas_dsyr(CblasUpper, 1.0 / delta, &U_col.vector, V_g);
}
gsl_blas_dsyrk(CblasUpper, CblasNoTrans, 1.0, E, 0.0, V_e);
// Copy the upper part to lower part.
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j < i; j++) {
gsl_matrix_set(V_g, i, j, gsl_matrix_get(V_g, j, i));
gsl_matrix_set(V_e, i, j, gsl_matrix_get(V_e, j, i));
}
}
// Add Sigma.
gsl_matrix_add(V_g, Sigma_uu);
gsl_matrix_add(V_e, Sigma_ee);
// Scale by 1/n.
gsl_matrix_scale(V_g, 1.0 / (double)n_size);
gsl_matrix_scale(V_e, 1.0 / (double)n_size);
return;
}
void CalcSigma(const char func_name, const gsl_vector *eval,
const gsl_vector *D_l, const gsl_matrix *X,
const gsl_matrix *OmegaU, const gsl_matrix *OmegaE,
const gsl_matrix *UltVeh, const gsl_matrix *Qi,
gsl_matrix *Sigma_uu, gsl_matrix *Sigma_ee) {
if (func_name != 'R' && func_name != 'L' && func_name != 'r' &&
func_name != 'l') {
cout << "func_name only takes 'R' or 'L': 'R' for log-restricted "
<< "likelihood, 'L' for log-likelihood." << endl;
return;
}
size_t n_size = eval->size, c_size = X->size1;
size_t d_size = D_l->size, dc_size = Qi->size1;
gsl_matrix_set_zero(Sigma_uu);
gsl_matrix_set_zero(Sigma_ee);
double delta, dl, x, d;
// Calculate the first diagonal term.
gsl_vector_view Suu_diag = gsl_matrix_diagonal(Sigma_uu);
gsl_vector_view See_diag = gsl_matrix_diagonal(Sigma_ee);
for (size_t k = 0; k < n_size; k++) {
gsl_vector_const_view OmegaU_col = gsl_matrix_const_column(OmegaU, k);
gsl_vector_const_view OmegaE_col = gsl_matrix_const_column(OmegaE, k);
gsl_vector_add(&Suu_diag.vector, &OmegaU_col.vector);
gsl_vector_add(&See_diag.vector, &OmegaE_col.vector);
}
// Calculate the second term for REML.
if (func_name == 'R' || func_name == 'r') {
gsl_matrix *M_u = gsl_matrix_alloc(dc_size, d_size);
gsl_matrix *M_e = gsl_matrix_alloc(dc_size, d_size);
gsl_matrix *QiM = gsl_matrix_alloc(dc_size, d_size);
gsl_matrix_set_zero(M_u);
gsl_matrix_set_zero(M_e);
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
for (size_t i = 0; i < d_size; i++) {
dl = gsl_vector_get(D_l, i);
for (size_t j = 0; j < c_size; j++) {
x = gsl_matrix_get(X, j, k);
d = x / (delta * dl + 1.0);
gsl_matrix_set(M_e, j * d_size + i, i, d);
gsl_matrix_set(M_u, j * d_size + i, i, d * dl);
}
}
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, Qi, M_u, 0.0, QiM);
gsl_blas_dgemm(CblasTrans, CblasNoTrans, delta, M_u, QiM, 1.0, Sigma_uu);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, Qi, M_e, 0.0, QiM);
gsl_blas_dgemm(CblasTrans, CblasNoTrans, 1.0, M_e, QiM, 1.0, Sigma_ee);
}
gsl_matrix_free(M_u);
gsl_matrix_free(M_e);
gsl_matrix_free(QiM);
}
// Multiply both sides by VehUl.
gsl_matrix *M = gsl_matrix_alloc(d_size, d_size);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, Sigma_uu, UltVeh, 0.0, M);
gsl_blas_dgemm(CblasTrans, CblasNoTrans, 1.0, UltVeh, M, 0.0, Sigma_uu);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, Sigma_ee, UltVeh, 0.0, M);
gsl_blas_dgemm(CblasTrans, CblasNoTrans, 1.0, UltVeh, M, 0.0, Sigma_ee);
gsl_matrix_free(M);
return;
}
// 'R' for restricted likelihood and 'L' for likelihood.
// 'R' update B and 'L' don't.
// only calculate -0.5*\sum_{k=1}^n|H_k|-0.5yPxy.
double MphCalcLogL(const gsl_vector *eval, const gsl_vector *xHiy,
const gsl_vector *D_l, const gsl_matrix *UltVehiY,
const gsl_matrix *Qi) {
size_t n_size = eval->size, d_size = D_l->size, dc_size = Qi->size1;
double logl = 0.0, delta, dl, y, d;
// Calculate yHiy+log|H_k|.
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
for (size_t i = 0; i < d_size; i++) {
y = gsl_matrix_get(UltVehiY, i, k);
dl = gsl_vector_get(D_l, i);
d = delta * dl + 1.0;
logl += y * y / d + safe_log(d);
}
}
// Calculate the rest of yPxy.
gsl_vector *Qiv = gsl_vector_alloc(dc_size);
gsl_blas_dgemv(CblasNoTrans, 1.0, Qi, xHiy, 0.0, Qiv);
gsl_blas_ddot(xHiy, Qiv, &d);
logl -= d;
gsl_vector_free(Qiv);
return -0.5 * logl;
}
// Y is a dxn matrix, X is a cxn matrix, B is a dxc matrix, V_g is a
// dxd matrix, V_e is a dxd matrix, eval is a size n vector
//'R' for restricted likelihood and 'L' for likelihood.
double MphEM(const char func_name, const size_t max_iter, const double max_prec,
const gsl_vector *eval, const gsl_matrix *X, const gsl_matrix *Y,
gsl_matrix *U_hat, gsl_matrix *E_hat, gsl_matrix *OmegaU,
gsl_matrix *OmegaE, gsl_matrix *UltVehiY, gsl_matrix *UltVehiBX,
gsl_matrix *UltVehiU, gsl_matrix *UltVehiE, gsl_matrix *V_g,
gsl_matrix *V_e, gsl_matrix *B) {
if (func_name != 'R' && func_name != 'L' && func_name != 'r' &&
func_name != 'l') {
cout << "func_name only takes 'R' or 'L': 'R' for log-restricted "
<< "likelihood, 'L' for log-likelihood." << endl;
return 0.0;
}
size_t n_size = eval->size, c_size = X->size1, d_size = Y->size1;
size_t dc_size = d_size * c_size;
gsl_matrix *XXt = gsl_matrix_alloc(c_size, c_size);
gsl_matrix *XXti = gsl_matrix_alloc(c_size, c_size);
gsl_vector *D_l = gsl_vector_alloc(d_size);
gsl_matrix *UltVeh = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *UltVehi = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *UltVehiB = gsl_matrix_alloc(d_size, c_size);
gsl_matrix *Qi = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *Sigma_uu = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *Sigma_ee = gsl_matrix_alloc(d_size, d_size);
gsl_vector *xHiy = gsl_vector_alloc(dc_size);
gsl_permutation *pmt = gsl_permutation_alloc(c_size);
double logl_const = 0.0, logl_old = 0.0, logl_new = 0.0;
double logdet_Q, logdet_Ve;
int sig;
// Calculate |XXt| and (XXt)^{-1}.
gsl_blas_dsyrk(CblasUpper, CblasNoTrans, 1.0, X, 0.0, XXt);
for (size_t i = 0; i < c_size; ++i) {
for (size_t j = 0; j < i; ++j) {
gsl_matrix_set(XXt, i, j, gsl_matrix_get(XXt, j, i));
}
}
LUDecomp(XXt, pmt, &sig);
LUInvert(XXt, pmt, XXti);
// Calculate the constant for logl.
if (func_name == 'R' || func_name == 'r') {
logl_const =
-0.5 * (double)(n_size - c_size) * (double)d_size * safe_log(2.0 * M_PI) +
0.5 * (double)d_size * LULndet(XXt);
} else {
logl_const = -0.5 * (double)n_size * (double)d_size * safe_log(2.0 * M_PI);
}
// Start EM.
for (size_t t = 0; t < max_iter; t++) {
logdet_Ve = EigenProc(V_g, V_e, D_l, UltVeh, UltVehi);
logdet_Q = CalcQi(eval, D_l, X, Qi);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, UltVehi, Y, 0.0, UltVehiY);
CalcXHiY(eval, D_l, X, UltVehiY, xHiy);
// Calculate log likelihood/restricted likelihood value, and
// terminate if change is small.
logl_new = logl_const + MphCalcLogL(eval, xHiy, D_l, UltVehiY, Qi) -
0.5 * (double)n_size * logdet_Ve;
if (func_name == 'R' || func_name == 'r') {
logl_new += -0.5 * (logdet_Q - (double)c_size * logdet_Ve);
}
if (t != 0 && abs(logl_new - logl_old) < max_prec) {
break;
}
logl_old = logl_new;
CalcOmega(eval, D_l, OmegaU, OmegaE);
// Update UltVehiB, UltVehiU.
if (func_name == 'R' || func_name == 'r') {
UpdateRL_B(xHiy, Qi, UltVehiB);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, UltVehiB, X, 0.0,
UltVehiBX);
} else if (t == 0) {
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, UltVehi, B, 0.0,
UltVehiB);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, UltVehiB, X, 0.0,
UltVehiBX);
}
UpdateU(OmegaE, UltVehiY, UltVehiBX, UltVehiU);
if (func_name == 'L' || func_name == 'l') {
// UltVehiBX is destroyed here.
UpdateL_B(X, XXti, UltVehiY, UltVehiU, UltVehiBX, UltVehiB);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, UltVehiB, X, 0.0,
UltVehiBX);
}
UpdateE(UltVehiY, UltVehiBX, UltVehiU, UltVehiE);
// Calculate U_hat, E_hat and B.
gsl_blas_dgemm(CblasTrans, CblasNoTrans, 1.0, UltVeh, UltVehiU, 0.0, U_hat);
gsl_blas_dgemm(CblasTrans, CblasNoTrans, 1.0, UltVeh, UltVehiE, 0.0, E_hat);
gsl_blas_dgemm(CblasTrans, CblasNoTrans, 1.0, UltVeh, UltVehiB, 0.0, B);
// Calculate Sigma_uu and Sigma_ee.
CalcSigma(func_name, eval, D_l, X, OmegaU, OmegaE, UltVeh, Qi, Sigma_uu,
Sigma_ee);
// Update V_g and V_e.
UpdateV(eval, U_hat, E_hat, Sigma_uu, Sigma_ee, V_g, V_e);
}
gsl_matrix_free(XXt);
gsl_matrix_free(XXti);
gsl_vector_free(D_l);
gsl_matrix_free(UltVeh);
gsl_matrix_free(UltVehi);
gsl_matrix_free(UltVehiB);
gsl_matrix_free(Qi);
gsl_matrix_free(Sigma_uu);
gsl_matrix_free(Sigma_ee);
gsl_vector_free(xHiy);
gsl_permutation_free(pmt);
return logl_new;
}
// Calculate p-value, beta (d by 1 vector) and V(beta).
double MphCalcP(const gsl_vector *eval, const gsl_vector *x_vec,
const gsl_matrix *W, const gsl_matrix *Y, const gsl_matrix *V_g,
const gsl_matrix *V_e, gsl_matrix *UltVehiY, gsl_vector *beta,
gsl_matrix *Vbeta) {
size_t n_size = eval->size, c_size = W->size1, d_size = V_g->size1;
size_t dc_size = d_size * c_size;
double delta, dl, d, d1, d2, dy, dx, dw; // logdet_Ve, logdet_Q, p_value;
gsl_vector *D_l = gsl_vector_alloc(d_size);
gsl_matrix *UltVeh = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *UltVehi = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *Qi = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *WHix = gsl_matrix_alloc(dc_size, d_size);
gsl_matrix *QiWHix = gsl_matrix_alloc(dc_size, d_size);
gsl_matrix *xPx = gsl_matrix_alloc(d_size, d_size);
gsl_vector *xPy = gsl_vector_alloc(d_size);
gsl_vector *WHiy = gsl_vector_alloc(dc_size);
gsl_matrix_set_zero(xPx);
gsl_matrix_set_zero(WHix);
gsl_vector_set_zero(xPy);
gsl_vector_set_zero(WHiy);
// Eigen decomposition and calculate log|Ve|.
// double logdet_Ve = EigenProc(V_g, V_e, D_l, UltVeh, UltVehi);
EigenProc(V_g, V_e, D_l, UltVeh, UltVehi);
// Calculate Qi and log|Q|.
// double logdet_Q = CalcQi(eval, D_l, W, Qi);
CalcQi(eval, D_l, W, Qi);
// Calculate UltVehiY.
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, UltVehi, Y, 0.0, UltVehiY);
// Calculate WHix, WHiy, xHiy, xHix.
for (size_t i = 0; i < d_size; i++) {
dl = gsl_vector_get(D_l, i);
d1 = 0.0;
d2 = 0.0;
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
dx = gsl_vector_get(x_vec, k);
dy = gsl_matrix_get(UltVehiY, i, k);
d1 += dx * dy / (delta * dl + 1.0);
d2 += dx * dx / (delta * dl + 1.0);
}
gsl_vector_set(xPy, i, d1);
gsl_matrix_set(xPx, i, i, d2);
for (size_t j = 0; j < c_size; j++) {
d1 = 0.0;
d2 = 0.0;
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
dx = gsl_vector_get(x_vec, k);
dw = gsl_matrix_get(W, j, k);
dy = gsl_matrix_get(UltVehiY, i, k);
d1 += dx * dw / (delta * dl + 1.0);
d2 += dy * dw / (delta * dl + 1.0);
}
gsl_matrix_set(WHix, j * d_size + i, i, d1);
gsl_vector_set(WHiy, j * d_size + i, d2);
}
}
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, Qi, WHix, 0.0, QiWHix);
gsl_blas_dgemm(CblasTrans, CblasNoTrans, -1.0, WHix, QiWHix, 1.0, xPx);
gsl_blas_dgemv(CblasTrans, -1.0, QiWHix, WHiy, 1.0, xPy);
// Calculate V(beta) and beta.
int sig;
gsl_permutation *pmt = gsl_permutation_alloc(d_size);
LUDecomp(xPx, pmt, &sig);
LUSolve(xPx, pmt, xPy, D_l);
LUInvert(xPx, pmt, Vbeta);
// Need to multiply UltVehi on both sides or one side.
gsl_blas_dgemv(CblasTrans, 1.0, UltVeh, D_l, 0.0, beta);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, Vbeta, UltVeh, 0.0, xPx);
gsl_blas_dgemm(CblasTrans, CblasNoTrans, 1.0, UltVeh, xPx, 0.0, Vbeta);
// Calculate test statistic and p value.
gsl_blas_ddot(D_l, xPy, &d);
double p_value = gsl_cdf_chisq_Q(d, (double)d_size);
gsl_vector_free(D_l);
gsl_matrix_free(UltVeh);
gsl_matrix_free(UltVehi);
gsl_matrix_free(Qi);
gsl_matrix_free(WHix);
gsl_matrix_free(QiWHix);
gsl_matrix_free(xPx);
gsl_vector_free(xPy);
gsl_vector_free(WHiy);
gsl_permutation_free(pmt);
return p_value;
}
// Calculate B and its standard error (which is a matrix of the same
// dimension as B).
void MphCalcBeta(const gsl_vector *eval, const gsl_matrix *W,
const gsl_matrix *Y, const gsl_matrix *V_g,
const gsl_matrix *V_e, gsl_matrix *UltVehiY, gsl_matrix *B,
gsl_matrix *se_B) {
size_t n_size = eval->size, c_size = W->size1, d_size = V_g->size1;
size_t dc_size = d_size * c_size;
double delta, dl, d, dy, dw; // , logdet_Ve, logdet_Q;
gsl_vector *D_l = gsl_vector_alloc(d_size);
gsl_matrix *UltVeh = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *UltVehi = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *Qi = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *Qi_temp = gsl_matrix_alloc(dc_size, dc_size);
gsl_vector *WHiy = gsl_vector_alloc(dc_size);
gsl_vector *QiWHiy = gsl_vector_alloc(dc_size);
gsl_vector *beta = gsl_vector_alloc(dc_size);
gsl_matrix *Vbeta = gsl_matrix_alloc(dc_size, dc_size);
gsl_vector_set_zero(WHiy);
// Eigen decomposition and calculate log|Ve|.
// double logdet_Ve = EigenProc(V_g, V_e, D_l, UltVeh, UltVehi);
EigenProc(V_g, V_e, D_l, UltVeh, UltVehi);
// Calculate Qi and log|Q|.
// double logdet_Q = CalcQi(eval, D_l, W, Qi);
CalcQi(eval, D_l, W, Qi);
// Calculate UltVehiY.
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, UltVehi, Y, 0.0, UltVehiY);
// Calculate WHiy.
for (size_t i = 0; i < d_size; i++) {
dl = gsl_vector_get(D_l, i);
for (size_t j = 0; j < c_size; j++) {
d = 0.0;
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
dw = gsl_matrix_get(W, j, k);
dy = gsl_matrix_get(UltVehiY, i, k);
d += dy * dw / (delta * dl + 1.0);
}
gsl_vector_set(WHiy, j * d_size + i, d);
}
}
gsl_blas_dgemv(CblasNoTrans, 1.0, Qi, WHiy, 0.0, QiWHiy);
// Need to multiply I_c\otimes UltVehi on both sides or one side.
for (size_t i = 0; i < c_size; i++) {
gsl_vector_view QiWHiy_sub =
gsl_vector_subvector(QiWHiy, i * d_size, d_size);
gsl_vector_view beta_sub = gsl_vector_subvector(beta, i * d_size, d_size);
gsl_blas_dgemv(CblasTrans, 1.0, UltVeh, &QiWHiy_sub.vector, 0.0,
&beta_sub.vector);
for (size_t j = 0; j < c_size; j++) {
gsl_matrix_view Qi_sub =
gsl_matrix_submatrix(Qi, i * d_size, j * d_size, d_size, d_size);
gsl_matrix_view Qitemp_sub =
gsl_matrix_submatrix(Qi_temp, i * d_size, j * d_size, d_size, d_size);
gsl_matrix_view Vbeta_sub =
gsl_matrix_submatrix(Vbeta, i * d_size, j * d_size, d_size, d_size);
if (j < i) {
gsl_matrix_view Vbeta_sym =
gsl_matrix_submatrix(Vbeta, j * d_size, i * d_size, d_size, d_size);
gsl_matrix_transpose_memcpy(&Vbeta_sub.matrix, &Vbeta_sym.matrix);
} else {
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &Qi_sub.matrix, UltVeh,
0.0, &Qitemp_sub.matrix);
gsl_blas_dgemm(CblasTrans, CblasNoTrans, 1.0, UltVeh,
&Qitemp_sub.matrix, 0.0, &Vbeta_sub.matrix);
}
}
}
// Copy beta to B, and Vbeta to se_B.
for (size_t j = 0; j < B->size2; j++) {
for (size_t i = 0; i < B->size1; i++) {
gsl_matrix_set(B, i, j, gsl_vector_get(beta, j * d_size + i));
gsl_matrix_set(se_B, i, j, safe_sqrt(gsl_matrix_get(Vbeta, j * d_size + i,
j * d_size + i)));
}
}
// Free matrices.
gsl_vector_free(D_l);
gsl_matrix_free(UltVeh);
gsl_matrix_free(UltVehi);
gsl_matrix_free(Qi);
gsl_matrix_free(Qi_temp);
gsl_vector_free(WHiy);
gsl_vector_free(QiWHiy);
gsl_vector_free(beta);
gsl_matrix_free(Vbeta);
return;
}
// Below are functions for Newton-Raphson's algorithm.
// Calculate all Hi and return logdet_H=\sum_{k=1}^{n}log|H_k|
// and calculate Qi and return logdet_Q
// and calculate yPy.
void CalcHiQi(const gsl_vector *eval, const gsl_matrix *X,
const gsl_matrix *V_g, const gsl_matrix *V_e, gsl_matrix *Hi_all,
gsl_matrix *Qi, double &logdet_H, double &logdet_Q) {
gsl_matrix_set_zero(Hi_all);
gsl_matrix_set_zero(Qi);
logdet_H = 0.0;
logdet_Q = 0.0;
size_t n_size = eval->size, c_size = X->size1, d_size = V_g->size1;
double logdet_Ve = 0.0, delta, dl, d;
gsl_matrix *mat_dd = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *UltVeh = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *UltVehi = gsl_matrix_alloc(d_size, d_size);
gsl_vector *D_l = gsl_vector_alloc(d_size);
// Calculate D_l, UltVeh and UltVehi.
logdet_Ve = EigenProc(V_g, V_e, D_l, UltVeh, UltVehi);
// Calculate each Hi and log|H_k|.
logdet_H = (double)n_size * logdet_Ve;
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
gsl_matrix_memcpy(mat_dd, UltVehi);
for (size_t i = 0; i < d_size; i++) {
dl = gsl_vector_get(D_l, i);
d = delta * dl + 1.0;
gsl_vector_view mat_row = gsl_matrix_row(mat_dd, i);
gsl_vector_scale(&mat_row.vector, 1.0 / d); // @@
logdet_H += safe_log(d);
}
gsl_matrix_view Hi_k =
gsl_matrix_submatrix(Hi_all, 0, k * d_size, d_size, d_size);
gsl_blas_dgemm(CblasTrans, CblasNoTrans, 1.0, UltVehi, mat_dd, 0.0,
&Hi_k.matrix);
}
// Calculate Qi, and multiply I\o times UtVeh on both side and
// calculate logdet_Q, don't forget to substract
// c_size*logdet_Ve.
logdet_Q = CalcQi(eval, D_l, X, Qi) - (double)c_size * logdet_Ve;
for (size_t i = 0; i < c_size; i++) {
for (size_t j = 0; j < c_size; j++) {
gsl_matrix_view Qi_sub =
gsl_matrix_submatrix(Qi, i * d_size, j * d_size, d_size, d_size);
if (j < i) {
gsl_matrix_view Qi_sym =
gsl_matrix_submatrix(Qi, j * d_size, i * d_size, d_size, d_size);
gsl_matrix_transpose_memcpy(&Qi_sub.matrix, &Qi_sym.matrix);
} else {
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &Qi_sub.matrix, UltVeh,
0.0, mat_dd);
gsl_blas_dgemm(CblasTrans, CblasNoTrans, 1.0, UltVeh, mat_dd, 0.0,
&Qi_sub.matrix);
}
}
}
// Free memory.
gsl_matrix_free(mat_dd);
gsl_matrix_free(UltVeh);
gsl_matrix_free(UltVehi);
gsl_vector_free(D_l);
return;
}
// Calculate all Hiy.
void Calc_Hiy_all(const gsl_matrix *Y, const gsl_matrix *Hi_all,
gsl_matrix *Hiy_all) {
gsl_matrix_set_zero(Hiy_all);
size_t n_size = Y->size2, d_size = Y->size1;
for (size_t k = 0; k < n_size; k++) {
gsl_matrix_const_view Hi_k =
gsl_matrix_const_submatrix(Hi_all, 0, k * d_size, d_size, d_size);
gsl_vector_const_view y_k = gsl_matrix_const_column(Y, k);
gsl_vector_view Hiy_k = gsl_matrix_column(Hiy_all, k);
gsl_blas_dgemv(CblasNoTrans, 1.0, &Hi_k.matrix, &y_k.vector, 0.0,
&Hiy_k.vector);
}
return;
}
// Calculate all xHi.
void Calc_xHi_all(const gsl_matrix *X, const gsl_matrix *Hi_all,
gsl_matrix *xHi_all) {
gsl_matrix_set_zero(xHi_all);
size_t n_size = X->size2, c_size = X->size1, d_size = Hi_all->size1;
double d;
for (size_t k = 0; k < n_size; k++) {
gsl_matrix_const_view Hi_k =
gsl_matrix_const_submatrix(Hi_all, 0, k * d_size, d_size, d_size);
for (size_t i = 0; i < c_size; i++) {
d = gsl_matrix_get(X, i, k);
gsl_matrix_view xHi_sub =
gsl_matrix_submatrix(xHi_all, i * d_size, k * d_size, d_size, d_size);
gsl_matrix_memcpy(&xHi_sub.matrix, &Hi_k.matrix);
gsl_matrix_scale(&xHi_sub.matrix, d);
}
}
return;
}
// Calculate scalar yHiy.
double Calc_yHiy(const gsl_matrix *Y, const gsl_matrix *Hiy_all) {
double yHiy = 0.0, d;
size_t n_size = Y->size2;
for (size_t k = 0; k < n_size; k++) {
gsl_vector_const_view y_k = gsl_matrix_const_column(Y, k);
gsl_vector_const_view Hiy_k = gsl_matrix_const_column(Hiy_all, k);
gsl_blas_ddot(&Hiy_k.vector, &y_k.vector, &d);
yHiy += d;
}
return yHiy;
}
// Calculate the vector xHiy.
void Calc_xHiy(const gsl_matrix *Y, const gsl_matrix *xHi, gsl_vector *xHiy) {
gsl_vector_set_zero(xHiy);
size_t n_size = Y->size2, d_size = Y->size1, dc_size = xHi->size1;
for (size_t k = 0; k < n_size; k++) {
gsl_matrix_const_view xHi_k =
gsl_matrix_const_submatrix(xHi, 0, k * d_size, dc_size, d_size);
gsl_vector_const_view y_k = gsl_matrix_const_column(Y, k);
gsl_blas_dgemv(CblasNoTrans, 1.0, &xHi_k.matrix, &y_k.vector, 1.0, xHiy);
}
return;
}
// 0<=i,j= d_size || j >= d_size) {
cout << "error in GetIndex." << endl;
return 0;
}
size_t s, l;
if (j < i) {
s = j;
l = i;
} else {
s = i;
l = j;
}
return (2 * d_size - s + 1) * s / 2 + l - s;
}
void Calc_yHiDHiy(const gsl_vector *eval, const gsl_matrix *Hiy, const size_t i,
const size_t j, double &yHiDHiy_g, double &yHiDHiy_e) {
yHiDHiy_g = 0.0;
yHiDHiy_e = 0.0;
size_t n_size = eval->size;
double delta, d1, d2;
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
d1 = gsl_matrix_get(Hiy, i, k);
d2 = gsl_matrix_get(Hiy, j, k);
if (i == j) {
yHiDHiy_g += delta * d1 * d2;
yHiDHiy_e += d1 * d2;
} else {
yHiDHiy_g += delta * d1 * d2 * 2.0;
yHiDHiy_e += d1 * d2 * 2.0;
}
}
return;
}
void Calc_xHiDHiy(const gsl_vector *eval, const gsl_matrix *xHi,
const gsl_matrix *Hiy, const size_t i, const size_t j,
gsl_vector *xHiDHiy_g, gsl_vector *xHiDHiy_e) {
gsl_vector_set_zero(xHiDHiy_g);
gsl_vector_set_zero(xHiDHiy_e);
size_t n_size = eval->size, d_size = Hiy->size1;
double delta, d;
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
gsl_vector_const_view xHi_col_i =
gsl_matrix_const_column(xHi, k * d_size + i);
d = gsl_matrix_get(Hiy, j, k);
gsl_blas_daxpy(d * delta, &xHi_col_i.vector, xHiDHiy_g);
gsl_blas_daxpy(d, &xHi_col_i.vector, xHiDHiy_e);
if (i != j) {
gsl_vector_const_view xHi_col_j =
gsl_matrix_const_column(xHi, k * d_size + j);
d = gsl_matrix_get(Hiy, i, k);
gsl_blas_daxpy(d * delta, &xHi_col_j.vector, xHiDHiy_g);
gsl_blas_daxpy(d, &xHi_col_j.vector, xHiDHiy_e);
}
}
return;
}
void Calc_xHiDHix(const gsl_vector *eval, const gsl_matrix *xHi, const size_t i,
const size_t j, gsl_matrix *xHiDHix_g,
gsl_matrix *xHiDHix_e) {
gsl_matrix_set_zero(xHiDHix_g);
gsl_matrix_set_zero(xHiDHix_e);
size_t n_size = eval->size, dc_size = xHi->size1;
size_t d_size = xHi->size2 / n_size;
double delta;
gsl_matrix *mat_dcdc = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *mat_dcdc_t = gsl_matrix_alloc(dc_size, dc_size);
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
gsl_vector_const_view xHi_col_i =
gsl_matrix_const_column(xHi, k * d_size + i);
gsl_vector_const_view xHi_col_j =
gsl_matrix_const_column(xHi, k * d_size + j);
gsl_matrix_set_zero(mat_dcdc);
gsl_blas_dger(1.0, &xHi_col_i.vector, &xHi_col_j.vector, mat_dcdc);
gsl_matrix_transpose_memcpy(mat_dcdc_t, mat_dcdc);
gsl_matrix_add(xHiDHix_e, mat_dcdc);
gsl_matrix_scale(mat_dcdc, delta);
gsl_matrix_add(xHiDHix_g, mat_dcdc);
if (i != j) {
gsl_matrix_add(xHiDHix_e, mat_dcdc_t);
gsl_matrix_scale(mat_dcdc_t, delta);
gsl_matrix_add(xHiDHix_g, mat_dcdc_t);
}
}
gsl_matrix_free(mat_dcdc);
gsl_matrix_free(mat_dcdc_t);
return;
}
void Calc_yHiDHiDHiy(const gsl_vector *eval, const gsl_matrix *Hi,
const gsl_matrix *Hiy, const size_t i1, const size_t j1,
const size_t i2, const size_t j2, double &yHiDHiDHiy_gg,
double &yHiDHiDHiy_ee, double &yHiDHiDHiy_ge) {
yHiDHiDHiy_gg = 0.0;
yHiDHiDHiy_ee = 0.0;
yHiDHiDHiy_ge = 0.0;
size_t n_size = eval->size, d_size = Hiy->size1;
double delta, d_Hiy_i1, d_Hiy_j1, d_Hiy_i2, d_Hiy_j2;
double d_Hi_i1i2, d_Hi_i1j2, d_Hi_j1i2, d_Hi_j1j2;
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
d_Hiy_i1 = gsl_matrix_get(Hiy, i1, k);
d_Hiy_j1 = gsl_matrix_get(Hiy, j1, k);
d_Hiy_i2 = gsl_matrix_get(Hiy, i2, k);
d_Hiy_j2 = gsl_matrix_get(Hiy, j2, k);
d_Hi_i1i2 = gsl_matrix_get(Hi, i1, k * d_size + i2);
d_Hi_i1j2 = gsl_matrix_get(Hi, i1, k * d_size + j2);
d_Hi_j1i2 = gsl_matrix_get(Hi, j1, k * d_size + i2);
d_Hi_j1j2 = gsl_matrix_get(Hi, j1, k * d_size + j2);
if (i1 == j1) {
yHiDHiDHiy_gg += delta * delta * (d_Hiy_i1 * d_Hi_j1i2 * d_Hiy_j2);
yHiDHiDHiy_ee += (d_Hiy_i1 * d_Hi_j1i2 * d_Hiy_j2);
yHiDHiDHiy_ge += delta * (d_Hiy_i1 * d_Hi_j1i2 * d_Hiy_j2);
if (i2 != j2) {
yHiDHiDHiy_gg += delta * delta * (d_Hiy_i1 * d_Hi_j1j2 * d_Hiy_i2);
yHiDHiDHiy_ee += (d_Hiy_i1 * d_Hi_j1j2 * d_Hiy_i2);
yHiDHiDHiy_ge += delta * (d_Hiy_i1 * d_Hi_j1j2 * d_Hiy_i2);
}
} else {
yHiDHiDHiy_gg += delta * delta * (d_Hiy_i1 * d_Hi_j1i2 * d_Hiy_j2 +
d_Hiy_j1 * d_Hi_i1i2 * d_Hiy_j2);
yHiDHiDHiy_ee +=
(d_Hiy_i1 * d_Hi_j1i2 * d_Hiy_j2 + d_Hiy_j1 * d_Hi_i1i2 * d_Hiy_j2);
yHiDHiDHiy_ge += delta * (d_Hiy_i1 * d_Hi_j1i2 * d_Hiy_j2 +
d_Hiy_j1 * d_Hi_i1i2 * d_Hiy_j2);
if (i2 != j2) {
yHiDHiDHiy_gg += delta * delta * (d_Hiy_i1 * d_Hi_j1j2 * d_Hiy_i2 +
d_Hiy_j1 * d_Hi_i1j2 * d_Hiy_i2);
yHiDHiDHiy_ee +=
(d_Hiy_i1 * d_Hi_j1j2 * d_Hiy_i2 + d_Hiy_j1 * d_Hi_i1j2 * d_Hiy_i2);
yHiDHiDHiy_ge += delta * (d_Hiy_i1 * d_Hi_j1j2 * d_Hiy_i2 +
d_Hiy_j1 * d_Hi_i1j2 * d_Hiy_i2);
}
}
}
return;
}
void Calc_xHiDHiDHiy(const gsl_vector *eval, const gsl_matrix *Hi,
const gsl_matrix *xHi, const gsl_matrix *Hiy,
const size_t i1, const size_t j1, const size_t i2,
const size_t j2, gsl_vector *xHiDHiDHiy_gg,
gsl_vector *xHiDHiDHiy_ee, gsl_vector *xHiDHiDHiy_ge) {
gsl_vector_set_zero(xHiDHiDHiy_gg);
gsl_vector_set_zero(xHiDHiDHiy_ee);
gsl_vector_set_zero(xHiDHiDHiy_ge);
size_t n_size = eval->size, d_size = Hiy->size1;
double delta, d_Hiy_i, d_Hiy_j, d_Hi_i1i2, d_Hi_i1j2;
double d_Hi_j1i2, d_Hi_j1j2;
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
gsl_vector_const_view xHi_col_i =
gsl_matrix_const_column(xHi, k * d_size + i1);
gsl_vector_const_view xHi_col_j =
gsl_matrix_const_column(xHi, k * d_size + j1);
d_Hiy_i = gsl_matrix_get(Hiy, i2, k);
d_Hiy_j = gsl_matrix_get(Hiy, j2, k);
d_Hi_i1i2 = gsl_matrix_get(Hi, i1, k * d_size + i2);
d_Hi_i1j2 = gsl_matrix_get(Hi, i1, k * d_size + j2);
d_Hi_j1i2 = gsl_matrix_get(Hi, j1, k * d_size + i2);
d_Hi_j1j2 = gsl_matrix_get(Hi, j1, k * d_size + j2);
if (i1 == j1) {
gsl_blas_daxpy(delta * delta * d_Hi_j1i2 * d_Hiy_j, &xHi_col_i.vector,
xHiDHiDHiy_gg);
gsl_blas_daxpy(d_Hi_j1i2 * d_Hiy_j, &xHi_col_i.vector, xHiDHiDHiy_ee);
gsl_blas_daxpy(delta * d_Hi_j1i2 * d_Hiy_j, &xHi_col_i.vector,
xHiDHiDHiy_ge);
if (i2 != j2) {
gsl_blas_daxpy(delta * delta * d_Hi_j1j2 * d_Hiy_i, &xHi_col_i.vector,
xHiDHiDHiy_gg);
gsl_blas_daxpy(d_Hi_j1j2 * d_Hiy_i, &xHi_col_i.vector, xHiDHiDHiy_ee);
gsl_blas_daxpy(delta * d_Hi_j1j2 * d_Hiy_i, &xHi_col_i.vector,
xHiDHiDHiy_ge);
}
} else {
gsl_blas_daxpy(delta * delta * d_Hi_j1i2 * d_Hiy_j, &xHi_col_i.vector,
xHiDHiDHiy_gg);
gsl_blas_daxpy(d_Hi_j1i2 * d_Hiy_j, &xHi_col_i.vector, xHiDHiDHiy_ee);
gsl_blas_daxpy(delta * d_Hi_j1i2 * d_Hiy_j, &xHi_col_i.vector,
xHiDHiDHiy_ge);
gsl_blas_daxpy(delta * delta * d_Hi_i1i2 * d_Hiy_j, &xHi_col_j.vector,
xHiDHiDHiy_gg);
gsl_blas_daxpy(d_Hi_i1i2 * d_Hiy_j, &xHi_col_j.vector, xHiDHiDHiy_ee);
gsl_blas_daxpy(delta * d_Hi_i1i2 * d_Hiy_j, &xHi_col_j.vector,
xHiDHiDHiy_ge);
if (i2 != j2) {
gsl_blas_daxpy(delta * delta * d_Hi_j1j2 * d_Hiy_i, &xHi_col_i.vector,
xHiDHiDHiy_gg);
gsl_blas_daxpy(d_Hi_j1j2 * d_Hiy_i, &xHi_col_i.vector, xHiDHiDHiy_ee);
gsl_blas_daxpy(delta * d_Hi_j1j2 * d_Hiy_i, &xHi_col_i.vector,
xHiDHiDHiy_ge);
gsl_blas_daxpy(delta * delta * d_Hi_i1j2 * d_Hiy_i, &xHi_col_j.vector,
xHiDHiDHiy_gg);
gsl_blas_daxpy(d_Hi_i1j2 * d_Hiy_i, &xHi_col_j.vector, xHiDHiDHiy_ee);
gsl_blas_daxpy(delta * d_Hi_i1j2 * d_Hiy_i, &xHi_col_j.vector,
xHiDHiDHiy_ge);
}
}
}
return;
}
void Calc_xHiDHiDHix(const gsl_vector *eval, const gsl_matrix *Hi,
const gsl_matrix *xHi, const size_t i1, const size_t j1,
const size_t i2, const size_t j2,
gsl_matrix *xHiDHiDHix_gg, gsl_matrix *xHiDHiDHix_ee,
gsl_matrix *xHiDHiDHix_ge) {
gsl_matrix_set_zero(xHiDHiDHix_gg);
gsl_matrix_set_zero(xHiDHiDHix_ee);
gsl_matrix_set_zero(xHiDHiDHix_ge);
size_t n_size = eval->size, d_size = Hi->size1, dc_size = xHi->size1;
double delta, d_Hi_i1i2, d_Hi_i1j2, d_Hi_j1i2, d_Hi_j1j2;
gsl_matrix *mat_dcdc = gsl_matrix_alloc(dc_size, dc_size);
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
gsl_vector_const_view xHi_col_i1 =
gsl_matrix_const_column(xHi, k * d_size + i1);
gsl_vector_const_view xHi_col_j1 =
gsl_matrix_const_column(xHi, k * d_size + j1);
gsl_vector_const_view xHi_col_i2 =
gsl_matrix_const_column(xHi, k * d_size + i2);
gsl_vector_const_view xHi_col_j2 =
gsl_matrix_const_column(xHi, k * d_size + j2);
d_Hi_i1i2 = gsl_matrix_get(Hi, i1, k * d_size + i2);
d_Hi_i1j2 = gsl_matrix_get(Hi, i1, k * d_size + j2);
d_Hi_j1i2 = gsl_matrix_get(Hi, j1, k * d_size + i2);
d_Hi_j1j2 = gsl_matrix_get(Hi, j1, k * d_size + j2);
if (i1 == j1) {
gsl_matrix_set_zero(mat_dcdc);
gsl_blas_dger(d_Hi_j1i2, &xHi_col_i1.vector, &xHi_col_j2.vector,
mat_dcdc);
gsl_matrix_add(xHiDHiDHix_ee, mat_dcdc);
gsl_matrix_scale(mat_dcdc, delta);
gsl_matrix_add(xHiDHiDHix_ge, mat_dcdc);
gsl_matrix_scale(mat_dcdc, delta);
gsl_matrix_add(xHiDHiDHix_gg, mat_dcdc);
if (i2 != j2) {
gsl_matrix_set_zero(mat_dcdc);
gsl_blas_dger(d_Hi_j1j2, &xHi_col_i1.vector, &xHi_col_i2.vector,
mat_dcdc);
gsl_matrix_add(xHiDHiDHix_ee, mat_dcdc);
gsl_matrix_scale(mat_dcdc, delta);
gsl_matrix_add(xHiDHiDHix_ge, mat_dcdc);
gsl_matrix_scale(mat_dcdc, delta);
gsl_matrix_add(xHiDHiDHix_gg, mat_dcdc);
}
} else {
gsl_matrix_set_zero(mat_dcdc);
gsl_blas_dger(d_Hi_j1i2, &xHi_col_i1.vector, &xHi_col_j2.vector,
mat_dcdc);
gsl_matrix_add(xHiDHiDHix_ee, mat_dcdc);
gsl_matrix_scale(mat_dcdc, delta);
gsl_matrix_add(xHiDHiDHix_ge, mat_dcdc);
gsl_matrix_scale(mat_dcdc, delta);
gsl_matrix_add(xHiDHiDHix_gg, mat_dcdc);
gsl_matrix_set_zero(mat_dcdc);
gsl_blas_dger(d_Hi_i1i2, &xHi_col_j1.vector, &xHi_col_j2.vector,
mat_dcdc);
gsl_matrix_add(xHiDHiDHix_ee, mat_dcdc);
gsl_matrix_scale(mat_dcdc, delta);
gsl_matrix_add(xHiDHiDHix_ge, mat_dcdc);
gsl_matrix_scale(mat_dcdc, delta);
gsl_matrix_add(xHiDHiDHix_gg, mat_dcdc);
if (i2 != j2) {
gsl_matrix_set_zero(mat_dcdc);
gsl_blas_dger(d_Hi_j1j2, &xHi_col_i1.vector, &xHi_col_i2.vector,
mat_dcdc);
gsl_matrix_add(xHiDHiDHix_ee, mat_dcdc);
gsl_matrix_scale(mat_dcdc, delta);
gsl_matrix_add(xHiDHiDHix_ge, mat_dcdc);
gsl_matrix_scale(mat_dcdc, delta);
gsl_matrix_add(xHiDHiDHix_gg, mat_dcdc);
gsl_matrix_set_zero(mat_dcdc);
gsl_blas_dger(d_Hi_i1j2, &xHi_col_j1.vector, &xHi_col_i2.vector,
mat_dcdc);
gsl_matrix_add(xHiDHiDHix_ee, mat_dcdc);
gsl_matrix_scale(mat_dcdc, delta);
gsl_matrix_add(xHiDHiDHix_ge, mat_dcdc);
gsl_matrix_scale(mat_dcdc, delta);
gsl_matrix_add(xHiDHiDHix_gg, mat_dcdc);
}
}
}
gsl_matrix_free(mat_dcdc);
return;
}
void Calc_traceHiD(const gsl_vector *eval, const gsl_matrix *Hi, const size_t i,
const size_t j, double &tHiD_g, double &tHiD_e) {
tHiD_g = 0.0;
tHiD_e = 0.0;
size_t n_size = eval->size, d_size = Hi->size1;
double delta, d;
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
d = gsl_matrix_get(Hi, j, k * d_size + i);
if (i == j) {
tHiD_g += delta * d;
tHiD_e += d;
} else {
tHiD_g += delta * d * 2.0;
tHiD_e += d * 2.0;
}
}
return;
}
void Calc_traceHiDHiD(const gsl_vector *eval, const gsl_matrix *Hi,
const size_t i1, const size_t j1, const size_t i2,
const size_t j2, double &tHiDHiD_gg, double &tHiDHiD_ee,
double &tHiDHiD_ge) {
tHiDHiD_gg = 0.0;
tHiDHiD_ee = 0.0;
tHiDHiD_ge = 0.0;
size_t n_size = eval->size, d_size = Hi->size1;
double delta, d_Hi_i1i2, d_Hi_i1j2, d_Hi_j1i2, d_Hi_j1j2;
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
d_Hi_i1i2 = gsl_matrix_get(Hi, i1, k * d_size + i2);
d_Hi_i1j2 = gsl_matrix_get(Hi, i1, k * d_size + j2);
d_Hi_j1i2 = gsl_matrix_get(Hi, j1, k * d_size + i2);
d_Hi_j1j2 = gsl_matrix_get(Hi, j1, k * d_size + j2);
if (i1 == j1) {
tHiDHiD_gg += delta * delta * d_Hi_i1j2 * d_Hi_j1i2;
tHiDHiD_ee += d_Hi_i1j2 * d_Hi_j1i2;
tHiDHiD_ge += delta * d_Hi_i1j2 * d_Hi_j1i2;
if (i2 != j2) {
tHiDHiD_gg += delta * delta * d_Hi_i1i2 * d_Hi_j1j2;
tHiDHiD_ee += d_Hi_i1i2 * d_Hi_j1j2;
tHiDHiD_ge += delta * d_Hi_i1i2 * d_Hi_j1j2;
}
} else {
tHiDHiD_gg +=
delta * delta * (d_Hi_i1j2 * d_Hi_j1i2 + d_Hi_j1j2 * d_Hi_i1i2);
tHiDHiD_ee += (d_Hi_i1j2 * d_Hi_j1i2 + d_Hi_j1j2 * d_Hi_i1i2);
tHiDHiD_ge += delta * (d_Hi_i1j2 * d_Hi_j1i2 + d_Hi_j1j2 * d_Hi_i1i2);
if (i2 != j2) {
tHiDHiD_gg +=
delta * delta * (d_Hi_i1i2 * d_Hi_j1j2 + d_Hi_j1i2 * d_Hi_i1j2);
tHiDHiD_ee += (d_Hi_i1i2 * d_Hi_j1j2 + d_Hi_j1i2 * d_Hi_i1j2);
tHiDHiD_ge += delta * (d_Hi_i1i2 * d_Hi_j1j2 + d_Hi_j1i2 * d_Hi_i1j2);
}
}
}
return;
}
// trace(PD) = trace((Hi-HixQixHi)D)=trace(HiD) - trace(HixQixHiD)
void Calc_tracePD(const gsl_vector *eval, const gsl_matrix *Qi,
const gsl_matrix *Hi, const gsl_matrix *xHiDHix_all_g,
const gsl_matrix *xHiDHix_all_e, const size_t i,
const size_t j, double &tPD_g, double &tPD_e) {
size_t dc_size = Qi->size1, d_size = Hi->size1;
size_t v = GetIndex(i, j, d_size);
double d;
// Calculate the first part: trace(HiD).
Calc_traceHiD(eval, Hi, i, j, tPD_g, tPD_e);
// Calculate the second part: -trace(HixQixHiD).
for (size_t k = 0; k < dc_size; k++) {
gsl_vector_const_view Qi_row = gsl_matrix_const_row(Qi, k);
gsl_vector_const_view xHiDHix_g_col =
gsl_matrix_const_column(xHiDHix_all_g, v * dc_size + k);
gsl_vector_const_view xHiDHix_e_col =
gsl_matrix_const_column(xHiDHix_all_e, v * dc_size + k);
gsl_blas_ddot(&Qi_row.vector, &xHiDHix_g_col.vector, &d);
tPD_g -= d;
gsl_blas_ddot(&Qi_row.vector, &xHiDHix_e_col.vector, &d);
tPD_e -= d;
}
return;
}
// trace(PDPD) = trace((Hi-HixQixHi)D(Hi-HixQixHi)D)
// = trace(HiDHiD) - trace(HixQixHiDHiD)
// - trace(HiDHixQixHiD) + trace(HixQixHiDHixQixHiD)
void Calc_tracePDPD(const gsl_vector *eval, const gsl_matrix *Qi,
const gsl_matrix *Hi, const gsl_matrix *xHi,
const gsl_matrix *QixHiDHix_all_g,
const gsl_matrix *QixHiDHix_all_e,
const gsl_matrix *xHiDHiDHix_all_gg,
const gsl_matrix *xHiDHiDHix_all_ee,
const gsl_matrix *xHiDHiDHix_all_ge, const size_t i1,
const size_t j1, const size_t i2, const size_t j2,
double &tPDPD_gg, double &tPDPD_ee, double &tPDPD_ge) {
size_t dc_size = Qi->size1, d_size = Hi->size1;
size_t v_size = d_size * (d_size + 1) / 2;
size_t v1 = GetIndex(i1, j1, d_size), v2 = GetIndex(i2, j2, d_size);
double d;
// Calculate the first part: trace(HiDHiD).
Calc_traceHiDHiD(eval, Hi, i1, j1, i2, j2, tPDPD_gg, tPDPD_ee, tPDPD_ge);
// Calculate the second and third parts:
// -trace(HixQixHiDHiD) - trace(HiDHixQixHiD)
for (size_t i = 0; i < dc_size; i++) {
gsl_vector_const_view Qi_row = gsl_matrix_const_row(Qi, i);
gsl_vector_const_view xHiDHiDHix_gg_col = gsl_matrix_const_column(
xHiDHiDHix_all_gg, (v1 * v_size + v2) * dc_size + i);
gsl_vector_const_view xHiDHiDHix_ee_col = gsl_matrix_const_column(
xHiDHiDHix_all_ee, (v1 * v_size + v2) * dc_size + i);
gsl_vector_const_view xHiDHiDHix_ge_col = gsl_matrix_const_column(
xHiDHiDHix_all_ge, (v1 * v_size + v2) * dc_size + i);
gsl_blas_ddot(&Qi_row.vector, &xHiDHiDHix_gg_col.vector, &d);
tPDPD_gg -= d * 2.0;
gsl_blas_ddot(&Qi_row.vector, &xHiDHiDHix_ee_col.vector, &d);
tPDPD_ee -= d * 2.0;
gsl_blas_ddot(&Qi_row.vector, &xHiDHiDHix_ge_col.vector, &d);
tPDPD_ge -= d * 2.0;
}
// Calculate the fourth part: trace(HixQixHiDHixQixHiD).
for (size_t i = 0; i < dc_size; i++) {
gsl_vector_const_view QixHiDHix_g_fullrow1 =
gsl_matrix_const_row(QixHiDHix_all_g, i);
gsl_vector_const_view QixHiDHix_e_fullrow1 =
gsl_matrix_const_row(QixHiDHix_all_e, i);
gsl_vector_const_view QixHiDHix_g_row1 = gsl_vector_const_subvector(
&QixHiDHix_g_fullrow1.vector, v1 * dc_size, dc_size);
gsl_vector_const_view QixHiDHix_e_row1 = gsl_vector_const_subvector(
&QixHiDHix_e_fullrow1.vector, v1 * dc_size, dc_size);
gsl_vector_const_view QixHiDHix_g_col2 =
gsl_matrix_const_column(QixHiDHix_all_g, v2 * dc_size + i);
gsl_vector_const_view QixHiDHix_e_col2 =
gsl_matrix_const_column(QixHiDHix_all_e, v2 * dc_size + i);
gsl_blas_ddot(&QixHiDHix_g_row1.vector, &QixHiDHix_g_col2.vector, &d);
tPDPD_gg += d;
gsl_blas_ddot(&QixHiDHix_e_row1.vector, &QixHiDHix_e_col2.vector, &d);
tPDPD_ee += d;
gsl_blas_ddot(&QixHiDHix_g_row1.vector, &QixHiDHix_e_col2.vector, &d);
tPDPD_ge += d;
}
return;
}
// Calculate (xHiDHiy) for every pair (i,j).
void Calc_xHiDHiy_all(const gsl_vector *eval, const gsl_matrix *xHi,
const gsl_matrix *Hiy, gsl_matrix *xHiDHiy_all_g,
gsl_matrix *xHiDHiy_all_e) {
gsl_matrix_set_zero(xHiDHiy_all_g);
gsl_matrix_set_zero(xHiDHiy_all_e);
size_t d_size = Hiy->size1;
size_t v;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j < d_size; j++) {
if (j < i) {
continue;
}
v = GetIndex(i, j, d_size);
gsl_vector_view xHiDHiy_g = gsl_matrix_column(xHiDHiy_all_g, v);
gsl_vector_view xHiDHiy_e = gsl_matrix_column(xHiDHiy_all_e, v);
Calc_xHiDHiy(eval, xHi, Hiy, i, j, &xHiDHiy_g.vector, &xHiDHiy_e.vector);
}
}
return;
}
// Calculate (xHiDHix) for every pair (i,j).
void Calc_xHiDHix_all(const gsl_vector *eval, const gsl_matrix *xHi,
gsl_matrix *xHiDHix_all_g, gsl_matrix *xHiDHix_all_e) {
gsl_matrix_set_zero(xHiDHix_all_g);
gsl_matrix_set_zero(xHiDHix_all_e);
size_t d_size = xHi->size2 / eval->size, dc_size = xHi->size1;
size_t v;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j < d_size; j++) {
if (j < i) {
continue;
}
v = GetIndex(i, j, d_size);
gsl_matrix_view xHiDHix_g =
gsl_matrix_submatrix(xHiDHix_all_g, 0, v * dc_size, dc_size, dc_size);
gsl_matrix_view xHiDHix_e =
gsl_matrix_submatrix(xHiDHix_all_e, 0, v * dc_size, dc_size, dc_size);
Calc_xHiDHix(eval, xHi, i, j, &xHiDHix_g.matrix, &xHiDHix_e.matrix);
}
}
return;
}
// Calculate (xHiDHiy) for every pair (i,j).
void Calc_xHiDHiDHiy_all(const size_t v_size, const gsl_vector *eval,
const gsl_matrix *Hi, const gsl_matrix *xHi,
const gsl_matrix *Hiy, gsl_matrix *xHiDHiDHiy_all_gg,
gsl_matrix *xHiDHiDHiy_all_ee,
gsl_matrix *xHiDHiDHiy_all_ge) {
gsl_matrix_set_zero(xHiDHiDHiy_all_gg);
gsl_matrix_set_zero(xHiDHiDHiy_all_ee);
gsl_matrix_set_zero(xHiDHiDHiy_all_ge);
size_t d_size = Hiy->size1;
size_t v1, v2;
for (size_t i1 = 0; i1 < d_size; i1++) {
for (size_t j1 = 0; j1 < d_size; j1++) {
if (j1 < i1) {
continue;
}
v1 = GetIndex(i1, j1, d_size);
for (size_t i2 = 0; i2 < d_size; i2++) {
for (size_t j2 = 0; j2 < d_size; j2++) {
if (j2 < i2) {
continue;
}
v2 = GetIndex(i2, j2, d_size);
gsl_vector_view xHiDHiDHiy_gg =
gsl_matrix_column(xHiDHiDHiy_all_gg, v1 * v_size + v2);
gsl_vector_view xHiDHiDHiy_ee =
gsl_matrix_column(xHiDHiDHiy_all_ee, v1 * v_size + v2);
gsl_vector_view xHiDHiDHiy_ge =
gsl_matrix_column(xHiDHiDHiy_all_ge, v1 * v_size + v2);
Calc_xHiDHiDHiy(eval, Hi, xHi, Hiy, i1, j1, i2, j2,
&xHiDHiDHiy_gg.vector, &xHiDHiDHiy_ee.vector,
&xHiDHiDHiy_ge.vector);
}
}
}
}
return;
}
// Calculate (xHiDHix) for every pair (i,j).
void Calc_xHiDHiDHix_all(const size_t v_size, const gsl_vector *eval,
const gsl_matrix *Hi, const gsl_matrix *xHi,
gsl_matrix *xHiDHiDHix_all_gg,
gsl_matrix *xHiDHiDHix_all_ee,
gsl_matrix *xHiDHiDHix_all_ge) {
gsl_matrix_set_zero(xHiDHiDHix_all_gg);
gsl_matrix_set_zero(xHiDHiDHix_all_ee);
gsl_matrix_set_zero(xHiDHiDHix_all_ge);
size_t d_size = xHi->size2 / eval->size, dc_size = xHi->size1;
size_t v1, v2;
for (size_t i1 = 0; i1 < d_size; i1++) {
for (size_t j1 = 0; j1 < d_size; j1++) {
if (j1 < i1) {
continue;
}
v1 = GetIndex(i1, j1, d_size);
for (size_t i2 = 0; i2 < d_size; i2++) {
for (size_t j2 = 0; j2 < d_size; j2++) {
if (j2 < i2) {
continue;
}
v2 = GetIndex(i2, j2, d_size);
if (v2 < v1) {
continue;
}
gsl_matrix_view xHiDHiDHix_gg1 = gsl_matrix_submatrix(
xHiDHiDHix_all_gg, 0, (v1 * v_size + v2) * dc_size, dc_size,
dc_size);
gsl_matrix_view xHiDHiDHix_ee1 = gsl_matrix_submatrix(
xHiDHiDHix_all_ee, 0, (v1 * v_size + v2) * dc_size, dc_size,
dc_size);
gsl_matrix_view xHiDHiDHix_ge1 = gsl_matrix_submatrix(
xHiDHiDHix_all_ge, 0, (v1 * v_size + v2) * dc_size, dc_size,
dc_size);
Calc_xHiDHiDHix(eval, Hi, xHi, i1, j1, i2, j2, &xHiDHiDHix_gg1.matrix,
&xHiDHiDHix_ee1.matrix, &xHiDHiDHix_ge1.matrix);
if (v2 != v1) {
gsl_matrix_view xHiDHiDHix_gg2 = gsl_matrix_submatrix(
xHiDHiDHix_all_gg, 0, (v2 * v_size + v1) * dc_size, dc_size,
dc_size);
gsl_matrix_view xHiDHiDHix_ee2 = gsl_matrix_submatrix(
xHiDHiDHix_all_ee, 0, (v2 * v_size + v1) * dc_size, dc_size,
dc_size);
gsl_matrix_view xHiDHiDHix_ge2 = gsl_matrix_submatrix(
xHiDHiDHix_all_ge, 0, (v2 * v_size + v1) * dc_size, dc_size,
dc_size);
gsl_matrix_memcpy(&xHiDHiDHix_gg2.matrix, &xHiDHiDHix_gg1.matrix);
gsl_matrix_memcpy(&xHiDHiDHix_ee2.matrix, &xHiDHiDHix_ee1.matrix);
gsl_matrix_memcpy(&xHiDHiDHix_ge2.matrix, &xHiDHiDHix_ge1.matrix);
}
}
}
}
}
return;
}
// Calculate (xHiDHix)Qi(xHiy) for every pair (i,j).
void Calc_xHiDHixQixHiy_all(const gsl_matrix *xHiDHix_all_g,
const gsl_matrix *xHiDHix_all_e,
const gsl_vector *QixHiy,
gsl_matrix *xHiDHixQixHiy_all_g,
gsl_matrix *xHiDHixQixHiy_all_e) {
size_t dc_size = xHiDHix_all_g->size1;
size_t v_size = xHiDHix_all_g->size2 / dc_size;
for (size_t i = 0; i < v_size; i++) {
gsl_matrix_const_view xHiDHix_g = gsl_matrix_const_submatrix(
xHiDHix_all_g, 0, i * dc_size, dc_size, dc_size);
gsl_matrix_const_view xHiDHix_e = gsl_matrix_const_submatrix(
xHiDHix_all_e, 0, i * dc_size, dc_size, dc_size);
gsl_vector_view xHiDHixQixHiy_g = gsl_matrix_column(xHiDHixQixHiy_all_g, i);
gsl_vector_view xHiDHixQixHiy_e = gsl_matrix_column(xHiDHixQixHiy_all_e, i);
gsl_blas_dgemv(CblasNoTrans, 1.0, &xHiDHix_g.matrix, QixHiy, 0.0,
&xHiDHixQixHiy_g.vector);
gsl_blas_dgemv(CblasNoTrans, 1.0, &xHiDHix_e.matrix, QixHiy, 0.0,
&xHiDHixQixHiy_e.vector);
}
return;
}
// Calculate Qi(xHiDHiy) and Qi(xHiDHix)Qi(xHiy) for each pair of i,j (i<=j).
void Calc_QiVec_all(const gsl_matrix *Qi, const gsl_matrix *vec_all_g,
const gsl_matrix *vec_all_e, gsl_matrix *Qivec_all_g,
gsl_matrix *Qivec_all_e) {
for (size_t i = 0; i < vec_all_g->size2; i++) {
gsl_vector_const_view vec_g = gsl_matrix_const_column(vec_all_g, i);
gsl_vector_const_view vec_e = gsl_matrix_const_column(vec_all_e, i);
gsl_vector_view Qivec_g = gsl_matrix_column(Qivec_all_g, i);
gsl_vector_view Qivec_e = gsl_matrix_column(Qivec_all_e, i);
gsl_blas_dgemv(CblasNoTrans, 1.0, Qi, &vec_g.vector, 0.0, &Qivec_g.vector);
gsl_blas_dgemv(CblasNoTrans, 1.0, Qi, &vec_e.vector, 0.0, &Qivec_e.vector);
}
return;
}
// Calculate Qi(xHiDHix) for each pair of i,j (i<=j).
void Calc_QiMat_all(const gsl_matrix *Qi, const gsl_matrix *mat_all_g,
const gsl_matrix *mat_all_e, gsl_matrix *Qimat_all_g,
gsl_matrix *Qimat_all_e) {
size_t dc_size = Qi->size1;
size_t v_size = mat_all_g->size2 / mat_all_g->size1;
for (size_t i = 0; i < v_size; i++) {
gsl_matrix_const_view mat_g =
gsl_matrix_const_submatrix(mat_all_g, 0, i * dc_size, dc_size, dc_size);
gsl_matrix_const_view mat_e =
gsl_matrix_const_submatrix(mat_all_e, 0, i * dc_size, dc_size, dc_size);
gsl_matrix_view Qimat_g =
gsl_matrix_submatrix(Qimat_all_g, 0, i * dc_size, dc_size, dc_size);
gsl_matrix_view Qimat_e =
gsl_matrix_submatrix(Qimat_all_e, 0, i * dc_size, dc_size, dc_size);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, Qi, &mat_g.matrix, 0.0,
&Qimat_g.matrix);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, Qi, &mat_e.matrix, 0.0,
&Qimat_e.matrix);
}
return;
}
// Calculate yPDPy
// yPDPy = y(Hi-HixQixHi)D(Hi-HixQixHi)y
// = ytHiDHiy - (yHix)Qi(xHiDHiy) - (yHiDHix)Qi(xHiy)
// + (yHix)Qi(xHiDHix)Qi(xtHiy)
void Calc_yPDPy(const gsl_vector *eval, const gsl_matrix *Hiy,
const gsl_vector *QixHiy, const gsl_matrix *xHiDHiy_all_g,
const gsl_matrix *xHiDHiy_all_e,
const gsl_matrix *xHiDHixQixHiy_all_g,
const gsl_matrix *xHiDHixQixHiy_all_e, const size_t i,
const size_t j, double &yPDPy_g, double &yPDPy_e) {
size_t d_size = Hiy->size1;
size_t v = GetIndex(i, j, d_size);
double d;
// First part: ytHiDHiy.
Calc_yHiDHiy(eval, Hiy, i, j, yPDPy_g, yPDPy_e);
// Second and third parts: -(yHix)Qi(xHiDHiy)-(yHiDHix)Qi(xHiy)
gsl_vector_const_view xHiDHiy_g = gsl_matrix_const_column(xHiDHiy_all_g, v);
gsl_vector_const_view xHiDHiy_e = gsl_matrix_const_column(xHiDHiy_all_e, v);
gsl_blas_ddot(QixHiy, &xHiDHiy_g.vector, &d);
yPDPy_g -= d * 2.0;
gsl_blas_ddot(QixHiy, &xHiDHiy_e.vector, &d);
yPDPy_e -= d * 2.0;
// Fourth part: +(yHix)Qi(xHiDHix)Qi(xHiy).
gsl_vector_const_view xHiDHixQixHiy_g =
gsl_matrix_const_column(xHiDHixQixHiy_all_g, v);
gsl_vector_const_view xHiDHixQixHiy_e =
gsl_matrix_const_column(xHiDHixQixHiy_all_e, v);
gsl_blas_ddot(QixHiy, &xHiDHixQixHiy_g.vector, &d);
yPDPy_g += d;
gsl_blas_ddot(QixHiy, &xHiDHixQixHiy_e.vector, &d);
yPDPy_e += d;
return;
}
// calculate yPDPDPy = y(Hi-HixQixHi)D(Hi-HixQixHi)D(Hi-HixQixHi)y
// yPDPDPy = yHiDHiDHiy
// - (yHix)Qi(xHiDHiDHiy)-(yHiDHiDHix)Qi(xHiy)
// - (yHiDHix)Qi(xHiDHiy)
// + (yHix)Qi(xHiDHix)Qi(xHiDHiy)
// + (yHiDHix)Qi(xHiDHix)Qi(xHiy)
// + (yHix)Qi(xHiDHiDHix)Qi(xHiy)
// - (yHix)Qi(xHiDHix)Qi(xHiDHix)Qi(xHiy)
void Calc_yPDPDPy(
const gsl_vector *eval, const gsl_matrix *Hi, const gsl_matrix *xHi,
const gsl_matrix *Hiy, const gsl_vector *QixHiy,
const gsl_matrix *xHiDHiy_all_g, const gsl_matrix *xHiDHiy_all_e,
const gsl_matrix *QixHiDHiy_all_g, const gsl_matrix *QixHiDHiy_all_e,
const gsl_matrix *xHiDHixQixHiy_all_g,
const gsl_matrix *xHiDHixQixHiy_all_e,
const gsl_matrix *QixHiDHixQixHiy_all_g,
const gsl_matrix *QixHiDHixQixHiy_all_e,
const gsl_matrix *xHiDHiDHiy_all_gg, const gsl_matrix *xHiDHiDHiy_all_ee,
const gsl_matrix *xHiDHiDHiy_all_ge, const gsl_matrix *xHiDHiDHix_all_gg,
const gsl_matrix *xHiDHiDHix_all_ee, const gsl_matrix *xHiDHiDHix_all_ge,
const size_t i1, const size_t j1, const size_t i2, const size_t j2,
double &yPDPDPy_gg, double &yPDPDPy_ee, double &yPDPDPy_ge) {
size_t d_size = Hi->size1, dc_size = xHi->size1;
size_t v1 = GetIndex(i1, j1, d_size), v2 = GetIndex(i2, j2, d_size);
size_t v_size = d_size * (d_size + 1) / 2;
double d;
gsl_vector *xHiDHiDHixQixHiy = gsl_vector_alloc(dc_size);
// First part: yHiDHiDHiy.
Calc_yHiDHiDHiy(eval, Hi, Hiy, i1, j1, i2, j2, yPDPDPy_gg, yPDPDPy_ee,
yPDPDPy_ge);
// Second and third parts:
// -(yHix)Qi(xHiDHiDHiy) - (yHiDHiDHix)Qi(xHiy).
gsl_vector_const_view xHiDHiDHiy_gg1 =
gsl_matrix_const_column(xHiDHiDHiy_all_gg, v1 * v_size + v2);
gsl_vector_const_view xHiDHiDHiy_ee1 =
gsl_matrix_const_column(xHiDHiDHiy_all_ee, v1 * v_size + v2);
gsl_vector_const_view xHiDHiDHiy_ge1 =
gsl_matrix_const_column(xHiDHiDHiy_all_ge, v1 * v_size + v2);
gsl_vector_const_view xHiDHiDHiy_gg2 =
gsl_matrix_const_column(xHiDHiDHiy_all_gg, v2 * v_size + v1);
gsl_vector_const_view xHiDHiDHiy_ee2 =
gsl_matrix_const_column(xHiDHiDHiy_all_ee, v2 * v_size + v1);
gsl_vector_const_view xHiDHiDHiy_ge2 =
gsl_matrix_const_column(xHiDHiDHiy_all_ge, v2 * v_size + v1);
gsl_blas_ddot(QixHiy, &xHiDHiDHiy_gg1.vector, &d);
yPDPDPy_gg -= d;
gsl_blas_ddot(QixHiy, &xHiDHiDHiy_ee1.vector, &d);
yPDPDPy_ee -= d;
gsl_blas_ddot(QixHiy, &xHiDHiDHiy_ge1.vector, &d);
yPDPDPy_ge -= d;
gsl_blas_ddot(QixHiy, &xHiDHiDHiy_gg2.vector, &d);
yPDPDPy_gg -= d;
gsl_blas_ddot(QixHiy, &xHiDHiDHiy_ee2.vector, &d);
yPDPDPy_ee -= d;
gsl_blas_ddot(QixHiy, &xHiDHiDHiy_ge2.vector, &d);
yPDPDPy_ge -= d;
// Fourth part: - (yHiDHix)Qi(xHiDHiy).
gsl_vector_const_view xHiDHiy_g1 = gsl_matrix_const_column(xHiDHiy_all_g, v1);
gsl_vector_const_view xHiDHiy_e1 = gsl_matrix_const_column(xHiDHiy_all_e, v1);
gsl_vector_const_view QixHiDHiy_g2 =
gsl_matrix_const_column(QixHiDHiy_all_g, v2);
gsl_vector_const_view QixHiDHiy_e2 =
gsl_matrix_const_column(QixHiDHiy_all_e, v2);
gsl_blas_ddot(&xHiDHiy_g1.vector, &QixHiDHiy_g2.vector, &d);
yPDPDPy_gg -= d;
gsl_blas_ddot(&xHiDHiy_e1.vector, &QixHiDHiy_e2.vector, &d);
yPDPDPy_ee -= d;
gsl_blas_ddot(&xHiDHiy_g1.vector, &QixHiDHiy_e2.vector, &d);
yPDPDPy_ge -= d;
// Fifth and sixth parts:
// + (yHix)Qi(xHiDHix)Qi(xHiDHiy) +
// (yHiDHix)Qi(xHiDHix)Qi(xHiy)
gsl_vector_const_view QixHiDHiy_g1 =
gsl_matrix_const_column(QixHiDHiy_all_g, v1);
gsl_vector_const_view QixHiDHiy_e1 =
gsl_matrix_const_column(QixHiDHiy_all_e, v1);
gsl_vector_const_view xHiDHixQixHiy_g1 =
gsl_matrix_const_column(xHiDHixQixHiy_all_g, v1);
gsl_vector_const_view xHiDHixQixHiy_e1 =
gsl_matrix_const_column(xHiDHixQixHiy_all_e, v1);
gsl_vector_const_view xHiDHixQixHiy_g2 =
gsl_matrix_const_column(xHiDHixQixHiy_all_g, v2);
gsl_vector_const_view xHiDHixQixHiy_e2 =
gsl_matrix_const_column(xHiDHixQixHiy_all_e, v2);
gsl_blas_ddot(&xHiDHixQixHiy_g1.vector, &QixHiDHiy_g2.vector, &d);
yPDPDPy_gg += d;
gsl_blas_ddot(&xHiDHixQixHiy_g2.vector, &QixHiDHiy_g1.vector, &d);
yPDPDPy_gg += d;
gsl_blas_ddot(&xHiDHixQixHiy_e1.vector, &QixHiDHiy_e2.vector, &d);
yPDPDPy_ee += d;
gsl_blas_ddot(&xHiDHixQixHiy_e2.vector, &QixHiDHiy_e1.vector, &d);
yPDPDPy_ee += d;
gsl_blas_ddot(&xHiDHixQixHiy_g1.vector, &QixHiDHiy_e2.vector, &d);
yPDPDPy_ge += d;
gsl_blas_ddot(&xHiDHixQixHiy_e2.vector, &QixHiDHiy_g1.vector, &d);
yPDPDPy_ge += d;
// Seventh part: + (yHix)Qi(xHiDHiDHix)Qi(xHiy)
gsl_matrix_const_view xHiDHiDHix_gg = gsl_matrix_const_submatrix(
xHiDHiDHix_all_gg, 0, (v1 * v_size + v2) * dc_size, dc_size, dc_size);
gsl_matrix_const_view xHiDHiDHix_ee = gsl_matrix_const_submatrix(
xHiDHiDHix_all_ee, 0, (v1 * v_size + v2) * dc_size, dc_size, dc_size);
gsl_matrix_const_view xHiDHiDHix_ge = gsl_matrix_const_submatrix(
xHiDHiDHix_all_ge, 0, (v1 * v_size + v2) * dc_size, dc_size, dc_size);
gsl_blas_dgemv(CblasNoTrans, 1.0, &xHiDHiDHix_gg.matrix, QixHiy, 0.0,
xHiDHiDHixQixHiy);
gsl_blas_ddot(xHiDHiDHixQixHiy, QixHiy, &d);
yPDPDPy_gg += d;
gsl_blas_dgemv(CblasNoTrans, 1.0, &xHiDHiDHix_ee.matrix, QixHiy, 0.0,
xHiDHiDHixQixHiy);
gsl_blas_ddot(xHiDHiDHixQixHiy, QixHiy, &d);
yPDPDPy_ee += d;
gsl_blas_dgemv(CblasNoTrans, 1.0, &xHiDHiDHix_ge.matrix, QixHiy, 0.0,
xHiDHiDHixQixHiy);
gsl_blas_ddot(xHiDHiDHixQixHiy, QixHiy, &d);
yPDPDPy_ge += d;
// Eighth part: - (yHix)Qi(xHiDHix)Qi(xHiDHix)Qi(xHiy).
gsl_vector_const_view QixHiDHixQixHiy_g1 =
gsl_matrix_const_column(QixHiDHixQixHiy_all_g, v1);
gsl_vector_const_view QixHiDHixQixHiy_e1 =
gsl_matrix_const_column(QixHiDHixQixHiy_all_e, v1);
gsl_blas_ddot(&QixHiDHixQixHiy_g1.vector, &xHiDHixQixHiy_g2.vector, &d);
yPDPDPy_gg -= d;
gsl_blas_ddot(&QixHiDHixQixHiy_e1.vector, &xHiDHixQixHiy_e2.vector, &d);
yPDPDPy_ee -= d;
gsl_blas_ddot(&QixHiDHixQixHiy_g1.vector, &xHiDHixQixHiy_e2.vector, &d);
yPDPDPy_ge -= d;
// Free memory.
gsl_vector_free(xHiDHiDHixQixHiy);
return;
}
// Calculate Edgeworth correctation factors for small samples notation
// and method follows Thomas J. Rothenberg, Econometirca 1984; 52 (4)
// M=xHiDHix
void CalcCRT(const gsl_matrix *Hessian_inv, const gsl_matrix *Qi,
const gsl_matrix *QixHiDHix_all_g,
const gsl_matrix *QixHiDHix_all_e,
const gsl_matrix *xHiDHiDHix_all_gg,
const gsl_matrix *xHiDHiDHix_all_ee,
const gsl_matrix *xHiDHiDHix_all_ge, const size_t d_size,
double &crt_a, double &crt_b, double &crt_c) {
crt_a = 0.0;
crt_b = 0.0;
crt_c = 0.0;
size_t dc_size = Qi->size1, v_size = Hessian_inv->size1 / 2;
size_t c_size = dc_size / d_size;
double h_gg, h_ge, h_ee, d, B = 0.0, C = 0.0, D = 0.0;
double trCg1, trCe1, trCg2, trCe2, trB_gg, trB_ge, trB_ee;
double trCC_gg, trCC_ge, trCC_ee, trD_gg = 0.0, trD_ge = 0.0, trD_ee = 0.0;
gsl_matrix *QiMQi_g1 = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *QiMQi_e1 = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *QiMQi_g2 = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *QiMQi_e2 = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *QiMQisQisi_g1 = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *QiMQisQisi_e1 = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *QiMQisQisi_g2 = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *QiMQisQisi_e2 = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *QiMQiMQi_gg = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *QiMQiMQi_ge = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *QiMQiMQi_ee = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *QiMMQi_gg = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *QiMMQi_ge = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *QiMMQi_ee = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *Qi_si = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *M_dd = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *M_dcdc = gsl_matrix_alloc(dc_size, dc_size);
// Invert Qi_sub to Qi_si.
gsl_matrix *Qi_sub = gsl_matrix_alloc(d_size, d_size);
gsl_matrix_const_view Qi_s = gsl_matrix_const_submatrix(
Qi, (c_size - 1) * d_size, (c_size - 1) * d_size, d_size, d_size);
int sig;
gsl_permutation *pmt = gsl_permutation_alloc(d_size);
gsl_matrix_memcpy(Qi_sub, &Qi_s.matrix);
LUDecomp(Qi_sub, pmt, &sig);
LUInvert(Qi_sub, pmt, Qi_si);
gsl_permutation_free(pmt);
gsl_matrix_free(Qi_sub);
// Calculate correction factors.
for (size_t v1 = 0; v1 < v_size; v1++) {
// Calculate Qi(xHiDHix)Qi, and subpart of it.
gsl_matrix_const_view QiM_g1 = gsl_matrix_const_submatrix(
QixHiDHix_all_g, 0, v1 * dc_size, dc_size, dc_size);
gsl_matrix_const_view QiM_e1 = gsl_matrix_const_submatrix(
QixHiDHix_all_e, 0, v1 * dc_size, dc_size, dc_size);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiM_g1.matrix, Qi, 0.0,
QiMQi_g1);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiM_e1.matrix, Qi, 0.0,
QiMQi_e1);
gsl_matrix_view QiMQi_g1_s = gsl_matrix_submatrix(
QiMQi_g1, (c_size - 1) * d_size, (c_size - 1) * d_size, d_size, d_size);
gsl_matrix_view QiMQi_e1_s = gsl_matrix_submatrix(
QiMQi_e1, (c_size - 1) * d_size, (c_size - 1) * d_size, d_size, d_size);
// Calculate trCg1 and trCe1.
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiMQi_g1_s.matrix, Qi_si,
0.0, QiMQisQisi_g1);
trCg1 = 0.0;
for (size_t k = 0; k < d_size; k++) {
trCg1 -= gsl_matrix_get(QiMQisQisi_g1, k, k);
}
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiMQi_e1_s.matrix, Qi_si,
0.0, QiMQisQisi_e1);
trCe1 = 0.0;
for (size_t k = 0; k < d_size; k++) {
trCe1 -= gsl_matrix_get(QiMQisQisi_e1, k, k);
}
for (size_t v2 = 0; v2 < v_size; v2++) {
if (v2 < v1) {
continue;
}
// Calculate Qi(xHiDHix)Qi, and subpart of it.
gsl_matrix_const_view QiM_g2 = gsl_matrix_const_submatrix(
QixHiDHix_all_g, 0, v2 * dc_size, dc_size, dc_size);
gsl_matrix_const_view QiM_e2 = gsl_matrix_const_submatrix(
QixHiDHix_all_e, 0, v2 * dc_size, dc_size, dc_size);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiM_g2.matrix, Qi, 0.0,
QiMQi_g2);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiM_e2.matrix, Qi, 0.0,
QiMQi_e2);
gsl_matrix_view QiMQi_g2_s =
gsl_matrix_submatrix(QiMQi_g2, (c_size - 1) * d_size,
(c_size - 1) * d_size, d_size, d_size);
gsl_matrix_view QiMQi_e2_s =
gsl_matrix_submatrix(QiMQi_e2, (c_size - 1) * d_size,
(c_size - 1) * d_size, d_size, d_size);
// Calculate trCg2 and trCe2.
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiMQi_g2_s.matrix, Qi_si,
0.0, QiMQisQisi_g2);
trCg2 = 0.0;
for (size_t k = 0; k < d_size; k++) {
trCg2 -= gsl_matrix_get(QiMQisQisi_g2, k, k);
}
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiMQi_e2_s.matrix, Qi_si,
0.0, QiMQisQisi_e2);
trCe2 = 0.0;
for (size_t k = 0; k < d_size; k++) {
trCe2 -= gsl_matrix_get(QiMQisQisi_e2, k, k);
}
// Calculate trCC_gg, trCC_ge, trCC_ee.
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, QiMQisQisi_g1,
QiMQisQisi_g2, 0.0, M_dd);
trCC_gg = 0.0;
for (size_t k = 0; k < d_size; k++) {
trCC_gg += gsl_matrix_get(M_dd, k, k);
}
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, QiMQisQisi_g1,
QiMQisQisi_e2, 0.0, M_dd);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, QiMQisQisi_e1,
QiMQisQisi_g2, 1.0, M_dd);
trCC_ge = 0.0;
for (size_t k = 0; k < d_size; k++) {
trCC_ge += gsl_matrix_get(M_dd, k, k);
}
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, QiMQisQisi_e1,
QiMQisQisi_e2, 0.0, M_dd);
trCC_ee = 0.0;
for (size_t k = 0; k < d_size; k++) {
trCC_ee += gsl_matrix_get(M_dd, k, k);
}
// Calculate Qi(xHiDHix)Qi(xHiDHix)Qi, and subpart of it.
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiM_g1.matrix, QiMQi_g2,
0.0, QiMQiMQi_gg);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiM_g1.matrix, QiMQi_e2,
0.0, QiMQiMQi_ge);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiM_e1.matrix, QiMQi_g2,
1.0, QiMQiMQi_ge);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiM_e1.matrix, QiMQi_e2,
0.0, QiMQiMQi_ee);
gsl_matrix_view QiMQiMQi_gg_s =
gsl_matrix_submatrix(QiMQiMQi_gg, (c_size - 1) * d_size,
(c_size - 1) * d_size, d_size, d_size);
gsl_matrix_view QiMQiMQi_ge_s =
gsl_matrix_submatrix(QiMQiMQi_ge, (c_size - 1) * d_size,
(c_size - 1) * d_size, d_size, d_size);
gsl_matrix_view QiMQiMQi_ee_s =
gsl_matrix_submatrix(QiMQiMQi_ee, (c_size - 1) * d_size,
(c_size - 1) * d_size, d_size, d_size);
// and part of trB_gg, trB_ge, trB_ee.
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiMQiMQi_gg_s.matrix,
Qi_si, 0.0, M_dd);
trB_gg = 0.0;
for (size_t k = 0; k < d_size; k++) {
d = gsl_matrix_get(M_dd, k, k);
trB_gg -= d;
}
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiMQiMQi_ge_s.matrix,
Qi_si, 0.0, M_dd);
trB_ge = 0.0;
for (size_t k = 0; k < d_size; k++) {
d = gsl_matrix_get(M_dd, k, k);
trB_ge -= d;
}
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiMQiMQi_ee_s.matrix,
Qi_si, 0.0, M_dd);
trB_ee = 0.0;
for (size_t k = 0; k < d_size; k++) {
d = gsl_matrix_get(M_dd, k, k);
trB_ee -= d;
}
// Calculate Qi(xHiDHiDHix)Qi, and subpart of it.
gsl_matrix_const_view MM_gg = gsl_matrix_const_submatrix(
xHiDHiDHix_all_gg, 0, (v1 * v_size + v2) * dc_size, dc_size, dc_size);
gsl_matrix_const_view MM_ge = gsl_matrix_const_submatrix(
xHiDHiDHix_all_ge, 0, (v1 * v_size + v2) * dc_size, dc_size, dc_size);
gsl_matrix_const_view MM_ee = gsl_matrix_const_submatrix(
xHiDHiDHix_all_ee, 0, (v1 * v_size + v2) * dc_size, dc_size, dc_size);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, Qi, &MM_gg.matrix, 0.0,
M_dcdc);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, M_dcdc, Qi, 0.0,
QiMMQi_gg);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, Qi, &MM_ge.matrix, 0.0,
M_dcdc);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, M_dcdc, Qi, 0.0,
QiMMQi_ge);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, Qi, &MM_ee.matrix, 0.0,
M_dcdc);
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, M_dcdc, Qi, 0.0,
QiMMQi_ee);
gsl_matrix_view QiMMQi_gg_s =
gsl_matrix_submatrix(QiMMQi_gg, (c_size - 1) * d_size,
(c_size - 1) * d_size, d_size, d_size);
gsl_matrix_view QiMMQi_ge_s =
gsl_matrix_submatrix(QiMMQi_ge, (c_size - 1) * d_size,
(c_size - 1) * d_size, d_size, d_size);
gsl_matrix_view QiMMQi_ee_s =
gsl_matrix_submatrix(QiMMQi_ee, (c_size - 1) * d_size,
(c_size - 1) * d_size, d_size, d_size);
// Calculate the other part of trB_gg, trB_ge, trB_ee.
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiMMQi_gg_s.matrix,
Qi_si, 0.0, M_dd);
for (size_t k = 0; k < d_size; k++) {
trB_gg += gsl_matrix_get(M_dd, k, k);
}
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiMMQi_ge_s.matrix,
Qi_si, 0.0, M_dd);
for (size_t k = 0; k < d_size; k++) {
trB_ge += 2.0 * gsl_matrix_get(M_dd, k, k);
}
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, &QiMMQi_ee_s.matrix,
Qi_si, 0.0, M_dd);
for (size_t k = 0; k < d_size; k++) {
trB_ee += gsl_matrix_get(M_dd, k, k);
}
// Calculate trD_gg, trD_ge, trD_ee.
trD_gg = 2.0 * trB_gg;
trD_ge = 2.0 * trB_ge;
trD_ee = 2.0 * trB_ee;
// calculate B, C and D
h_gg = -1.0 * gsl_matrix_get(Hessian_inv, v1, v2);
h_ge = -1.0 * gsl_matrix_get(Hessian_inv, v1, v2 + v_size);
h_ee = -1.0 * gsl_matrix_get(Hessian_inv, v1 + v_size, v2 + v_size);
B += h_gg * trB_gg + h_ge * trB_ge + h_ee * trB_ee;
C += h_gg * (trCC_gg + 0.5 * trCg1 * trCg2) +
h_ge * (trCC_ge + 0.5 * trCg1 * trCe2 + 0.5 * trCe1 * trCg2) +
h_ee * (trCC_ee + 0.5 * trCe1 * trCe2);
D += h_gg * (trCC_gg + 0.5 * trD_gg) + h_ge * (trCC_ge + 0.5 * trD_ge) +
h_ee * (trCC_ee + 0.5 * trD_ee);
if (v1 != v2) {
B += h_gg * trB_gg + h_ge * trB_ge + h_ee * trB_ee;
C += h_gg * (trCC_gg + 0.5 * trCg1 * trCg2) +
h_ge * (trCC_ge + 0.5 * trCg1 * trCe2 + 0.5 * trCe1 * trCg2) +
h_ee * (trCC_ee + 0.5 * trCe1 * trCe2);
D += h_gg * (trCC_gg + 0.5 * trD_gg) + h_ge * (trCC_ge + 0.5 * trD_ge) +
h_ee * (trCC_ee + 0.5 * trD_ee);
}
}
}
// Calculate a, b, c from B C D.
crt_a = 2.0 * D - C;
crt_b = 2.0 * B;
crt_c = C;
// Free matrix memory.
gsl_matrix_free(QiMQi_g1);
gsl_matrix_free(QiMQi_e1);
gsl_matrix_free(QiMQi_g2);
gsl_matrix_free(QiMQi_e2);
gsl_matrix_free(QiMQisQisi_g1);
gsl_matrix_free(QiMQisQisi_e1);
gsl_matrix_free(QiMQisQisi_g2);
gsl_matrix_free(QiMQisQisi_e2);
gsl_matrix_free(QiMQiMQi_gg);
gsl_matrix_free(QiMQiMQi_ge);
gsl_matrix_free(QiMQiMQi_ee);
gsl_matrix_free(QiMMQi_gg);
gsl_matrix_free(QiMMQi_ge);
gsl_matrix_free(QiMMQi_ee);
gsl_matrix_free(Qi_si);
gsl_matrix_free(M_dd);
gsl_matrix_free(M_dcdc);
return;
}
// Calculate first-order and second-order derivatives.
void CalcDev(const char func_name, const gsl_vector *eval, const gsl_matrix *Qi,
const gsl_matrix *Hi, const gsl_matrix *xHi, const gsl_matrix *Hiy,
const gsl_vector *QixHiy, gsl_vector *gradient,
gsl_matrix *Hessian_inv, double &crt_a, double &crt_b,
double &crt_c) {
if (func_name != 'R' && func_name != 'L' && func_name != 'r' &&
func_name != 'l') {
cout << "func_name only takes 'R' or 'L': 'R' for "
<< "log-restricted likelihood, 'L' for log-likelihood." << endl;
return;
}
size_t dc_size = Qi->size1, d_size = Hi->size1;
size_t c_size = dc_size / d_size;
size_t v_size = d_size * (d_size + 1) / 2;
size_t v1, v2;
double dev1_g, dev1_e, dev2_gg, dev2_ee, dev2_ge;
gsl_matrix *Hessian = gsl_matrix_alloc(v_size * 2, v_size * 2);
gsl_matrix *xHiDHiy_all_g = gsl_matrix_alloc(dc_size, v_size);
gsl_matrix *xHiDHiy_all_e = gsl_matrix_alloc(dc_size, v_size);
gsl_matrix *xHiDHix_all_g = gsl_matrix_alloc(dc_size, v_size * dc_size);
gsl_matrix *xHiDHix_all_e = gsl_matrix_alloc(dc_size, v_size * dc_size);
gsl_matrix *xHiDHixQixHiy_all_g = gsl_matrix_alloc(dc_size, v_size);
gsl_matrix *xHiDHixQixHiy_all_e = gsl_matrix_alloc(dc_size, v_size);
gsl_matrix *QixHiDHiy_all_g = gsl_matrix_alloc(dc_size, v_size);
gsl_matrix *QixHiDHiy_all_e = gsl_matrix_alloc(dc_size, v_size);
gsl_matrix *QixHiDHix_all_g = gsl_matrix_alloc(dc_size, v_size * dc_size);
gsl_matrix *QixHiDHix_all_e = gsl_matrix_alloc(dc_size, v_size * dc_size);
gsl_matrix *QixHiDHixQixHiy_all_g = gsl_matrix_alloc(dc_size, v_size);
gsl_matrix *QixHiDHixQixHiy_all_e = gsl_matrix_alloc(dc_size, v_size);
gsl_matrix *xHiDHiDHiy_all_gg = gsl_matrix_alloc(dc_size, v_size * v_size);
gsl_matrix *xHiDHiDHiy_all_ee = gsl_matrix_alloc(dc_size, v_size * v_size);
gsl_matrix *xHiDHiDHiy_all_ge = gsl_matrix_alloc(dc_size, v_size * v_size);
gsl_matrix *xHiDHiDHix_all_gg =
gsl_matrix_alloc(dc_size, v_size * v_size * dc_size);
gsl_matrix *xHiDHiDHix_all_ee =
gsl_matrix_alloc(dc_size, v_size * v_size * dc_size);
gsl_matrix *xHiDHiDHix_all_ge =
gsl_matrix_alloc(dc_size, v_size * v_size * dc_size);
// Calculate xHiDHiy_all, xHiDHix_all and xHiDHixQixHiy_all.
Calc_xHiDHiy_all(eval, xHi, Hiy, xHiDHiy_all_g, xHiDHiy_all_e);
Calc_xHiDHix_all(eval, xHi, xHiDHix_all_g, xHiDHix_all_e);
Calc_xHiDHixQixHiy_all(xHiDHix_all_g, xHiDHix_all_e, QixHiy,
xHiDHixQixHiy_all_g, xHiDHixQixHiy_all_e);
Calc_xHiDHiDHiy_all(v_size, eval, Hi, xHi, Hiy, xHiDHiDHiy_all_gg,
xHiDHiDHiy_all_ee, xHiDHiDHiy_all_ge);
Calc_xHiDHiDHix_all(v_size, eval, Hi, xHi, xHiDHiDHix_all_gg,
xHiDHiDHix_all_ee, xHiDHiDHix_all_ge);
// Calculate QixHiDHiy_all, QixHiDHix_all and QixHiDHixQixHiy_all.
Calc_QiVec_all(Qi, xHiDHiy_all_g, xHiDHiy_all_e, QixHiDHiy_all_g,
QixHiDHiy_all_e);
Calc_QiVec_all(Qi, xHiDHixQixHiy_all_g, xHiDHixQixHiy_all_e,
QixHiDHixQixHiy_all_g, QixHiDHixQixHiy_all_e);
Calc_QiMat_all(Qi, xHiDHix_all_g, xHiDHix_all_e, QixHiDHix_all_g,
QixHiDHix_all_e);
double tHiD_g, tHiD_e, tPD_g, tPD_e, tHiDHiD_gg, tHiDHiD_ee;
double tHiDHiD_ge, tPDPD_gg, tPDPD_ee, tPDPD_ge;
double yPDPy_g, yPDPy_e, yPDPDPy_gg, yPDPDPy_ee, yPDPDPy_ge;
// Calculate gradient and Hessian for Vg.
for (size_t i1 = 0; i1 < d_size; i1++) {
for (size_t j1 = 0; j1 < d_size; j1++) {
if (j1 < i1) {
continue;
}
v1 = GetIndex(i1, j1, d_size);
Calc_yPDPy(eval, Hiy, QixHiy, xHiDHiy_all_g, xHiDHiy_all_e,
xHiDHixQixHiy_all_g, xHiDHixQixHiy_all_e, i1, j1, yPDPy_g,
yPDPy_e);
if (func_name == 'R' || func_name == 'r') {
Calc_tracePD(eval, Qi, Hi, xHiDHix_all_g, xHiDHix_all_e, i1, j1, tPD_g,
tPD_e);
dev1_g = -0.5 * tPD_g + 0.5 * yPDPy_g;
dev1_e = -0.5 * tPD_e + 0.5 * yPDPy_e;
} else {
Calc_traceHiD(eval, Hi, i1, j1, tHiD_g, tHiD_e);
dev1_g = -0.5 * tHiD_g + 0.5 * yPDPy_g;
dev1_e = -0.5 * tHiD_e + 0.5 * yPDPy_e;
}
gsl_vector_set(gradient, v1, dev1_g);
gsl_vector_set(gradient, v1 + v_size, dev1_e);
for (size_t i2 = 0; i2 < d_size; i2++) {
for (size_t j2 = 0; j2 < d_size; j2++) {
if (j2 < i2) {
continue;
}
v2 = GetIndex(i2, j2, d_size);
if (v2 < v1) {
continue;
}
Calc_yPDPDPy(eval, Hi, xHi, Hiy, QixHiy, xHiDHiy_all_g, xHiDHiy_all_e,
QixHiDHiy_all_g, QixHiDHiy_all_e, xHiDHixQixHiy_all_g,
xHiDHixQixHiy_all_e, QixHiDHixQixHiy_all_g,
QixHiDHixQixHiy_all_e, xHiDHiDHiy_all_gg,
xHiDHiDHiy_all_ee, xHiDHiDHiy_all_ge, xHiDHiDHix_all_gg,
xHiDHiDHix_all_ee, xHiDHiDHix_all_ge, i1, j1, i2, j2,
yPDPDPy_gg, yPDPDPy_ee, yPDPDPy_ge);
// AI for REML.
if (func_name == 'R' || func_name == 'r') {
Calc_tracePDPD(eval, Qi, Hi, xHi, QixHiDHix_all_g, QixHiDHix_all_e,
xHiDHiDHix_all_gg, xHiDHiDHix_all_ee,
xHiDHiDHix_all_ge, i1, j1, i2, j2, tPDPD_gg,
tPDPD_ee, tPDPD_ge);
dev2_gg = 0.5 * tPDPD_gg - yPDPDPy_gg;
dev2_ee = 0.5 * tPDPD_ee - yPDPDPy_ee;
dev2_ge = 0.5 * tPDPD_ge - yPDPDPy_ge;
} else {
Calc_traceHiDHiD(eval, Hi, i1, j1, i2, j2, tHiDHiD_gg, tHiDHiD_ee,
tHiDHiD_ge);
dev2_gg = 0.5 * tHiDHiD_gg - yPDPDPy_gg;
dev2_ee = 0.5 * tHiDHiD_ee - yPDPDPy_ee;
dev2_ge = 0.5 * tHiDHiD_ge - yPDPDPy_ge;
}
// Set up Hessian.
gsl_matrix_set(Hessian, v1, v2, dev2_gg);
gsl_matrix_set(Hessian, v1 + v_size, v2 + v_size, dev2_ee);
gsl_matrix_set(Hessian, v1, v2 + v_size, dev2_ge);
gsl_matrix_set(Hessian, v2 + v_size, v1, dev2_ge);
if (v1 != v2) {
gsl_matrix_set(Hessian, v2, v1, dev2_gg);
gsl_matrix_set(Hessian, v2 + v_size, v1 + v_size, dev2_ee);
gsl_matrix_set(Hessian, v2, v1 + v_size, dev2_ge);
gsl_matrix_set(Hessian, v1 + v_size, v2, dev2_ge);
}
}
}
}
}
// Invert Hessian.
int sig;
gsl_permutation *pmt = gsl_permutation_alloc(v_size * 2);
LUDecomp(Hessian, pmt, &sig);
LUInvert(Hessian, pmt, Hessian_inv);
gsl_permutation_free(pmt);
gsl_matrix_free(Hessian);
// Calculate Edgeworth correction factors after inverting
// Hessian.
if (c_size > 1) {
CalcCRT(Hessian_inv, Qi, QixHiDHix_all_g, QixHiDHix_all_e,
xHiDHiDHix_all_gg, xHiDHiDHix_all_ee, xHiDHiDHix_all_ge, d_size,
crt_a, crt_b, crt_c);
} else {
crt_a = 0.0;
crt_b = 0.0;
crt_c = 0.0;
}
gsl_matrix_free(xHiDHiy_all_g);
gsl_matrix_free(xHiDHiy_all_e);
gsl_matrix_free(xHiDHix_all_g);
gsl_matrix_free(xHiDHix_all_e);
gsl_matrix_free(xHiDHixQixHiy_all_g);
gsl_matrix_free(xHiDHixQixHiy_all_e);
gsl_matrix_free(QixHiDHiy_all_g);
gsl_matrix_free(QixHiDHiy_all_e);
gsl_matrix_free(QixHiDHix_all_g);
gsl_matrix_free(QixHiDHix_all_e);
gsl_matrix_free(QixHiDHixQixHiy_all_g);
gsl_matrix_free(QixHiDHixQixHiy_all_e);
gsl_matrix_free(xHiDHiDHiy_all_gg);
gsl_matrix_free(xHiDHiDHiy_all_ee);
gsl_matrix_free(xHiDHiDHiy_all_ge);
gsl_matrix_free(xHiDHiDHix_all_gg);
gsl_matrix_free(xHiDHiDHix_all_ee);
gsl_matrix_free(xHiDHiDHix_all_ge);
return;
}
// Update Vg, Ve.
void UpdateVgVe(const gsl_matrix *Hessian_inv, const gsl_vector *gradient,
const double step_scale, gsl_matrix *V_g, gsl_matrix *V_e) {
size_t v_size = gradient->size / 2, d_size = V_g->size1;
size_t v;
gsl_vector *vec_v = gsl_vector_alloc(v_size * 2);
double d;
// Vectorize Vg and Ve.
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j < d_size; j++) {
if (j < i) {
continue;
}
v = GetIndex(i, j, d_size);
d = gsl_matrix_get(V_g, i, j);
gsl_vector_set(vec_v, v, d);
d = gsl_matrix_get(V_e, i, j);
gsl_vector_set(vec_v, v + v_size, d);
}
}
gsl_blas_dgemv(CblasNoTrans, -1.0 * step_scale, Hessian_inv, gradient, 1.0,
vec_v);
// Save Vg and Ve.
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j < d_size; j++) {
if (j < i) {
continue;
}
v = GetIndex(i, j, d_size);
d = gsl_vector_get(vec_v, v);
gsl_matrix_set(V_g, i, j, d);
gsl_matrix_set(V_g, j, i, d);
d = gsl_vector_get(vec_v, v + v_size);
gsl_matrix_set(V_e, i, j, d);
gsl_matrix_set(V_e, j, i, d);
}
}
gsl_vector_free(vec_v);
return;
}
double MphNR(const char func_name, const size_t max_iter, const double max_prec,
const gsl_vector *eval, const gsl_matrix *X, const gsl_matrix *Y,
gsl_matrix *Hi_all, gsl_matrix *xHi_all, gsl_matrix *Hiy_all,
gsl_matrix *V_g, gsl_matrix *V_e, gsl_matrix *Hessian_inv,
double &crt_a, double &crt_b, double &crt_c) {
if (func_name != 'R' && func_name != 'L' && func_name != 'r' &&
func_name != 'l') {
cout << "func_name only takes 'R' or 'L': 'R' for log-restricted "
<< "likelihood, 'L' for log-likelihood." << endl;
return 0.0;
}
size_t n_size = eval->size, c_size = X->size1, d_size = Y->size1;
size_t dc_size = d_size * c_size;
size_t v_size = d_size * (d_size + 1) / 2;
double logdet_H, logdet_Q, yPy, logl_const;
double logl_old = 0.0, logl_new = 0.0, step_scale;
int sig;
size_t step_iter, flag_pd;
gsl_matrix *Vg_save = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *Ve_save = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *V_temp = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *U_temp = gsl_matrix_alloc(d_size, d_size);
gsl_vector *D_temp = gsl_vector_alloc(d_size);
gsl_vector *xHiy = gsl_vector_alloc(dc_size);
gsl_vector *QixHiy = gsl_vector_alloc(dc_size);
gsl_matrix *Qi = gsl_matrix_alloc(dc_size, dc_size);
gsl_matrix *XXt = gsl_matrix_alloc(c_size, c_size);
gsl_vector *gradient = gsl_vector_alloc(v_size * 2);
// Calculate |XXt| and (XXt)^{-1}.
gsl_blas_dsyrk(CblasUpper, CblasNoTrans, 1.0, X, 0.0, XXt);
for (size_t i = 0; i < c_size; ++i) {
for (size_t j = 0; j < i; ++j) {
gsl_matrix_set(XXt, i, j, gsl_matrix_get(XXt, j, i));
}
}
gsl_permutation *pmt = gsl_permutation_alloc(c_size);
LUDecomp(XXt, pmt, &sig);
gsl_permutation_free(pmt);
// Calculate the constant for logl.
if (func_name == 'R' || func_name == 'r') {
logl_const =
-0.5 * (double)(n_size - c_size) * (double)d_size * safe_log(2.0 * M_PI) +
0.5 * (double)d_size * LULndet(XXt);
} else {
logl_const = -0.5 * (double)n_size * (double)d_size * safe_log(2.0 * M_PI);
}
// Optimization iterations.
for (size_t t = 0; t < max_iter; t++) {
gsl_matrix_memcpy(Vg_save, V_g);
gsl_matrix_memcpy(Ve_save, V_e);
step_scale = 1.0;
step_iter = 0;
do {
gsl_matrix_memcpy(V_g, Vg_save);
gsl_matrix_memcpy(V_e, Ve_save);
// Update Vg, Ve, and invert Hessian.
if (t != 0) {
UpdateVgVe(Hessian_inv, gradient, step_scale, V_g, V_e);
}
// Check if both Vg and Ve are positive definite.
flag_pd = 1;
gsl_matrix_memcpy(V_temp, V_e);
EigenDecomp(V_temp, U_temp, D_temp, 0);
for (size_t i = 0; i < d_size; i++) {
if (gsl_vector_get(D_temp, i) <= 0) {
flag_pd = 0;
}
}
gsl_matrix_memcpy(V_temp, V_g);
EigenDecomp(V_temp, U_temp, D_temp, 0);
for (size_t i = 0; i < d_size; i++) {
if (gsl_vector_get(D_temp, i) <= 0) {
flag_pd = 0;
}
}
// If flag_pd==1, continue to calculate quantities
// and logl.
if (flag_pd == 1) {
CalcHiQi(eval, X, V_g, V_e, Hi_all, Qi, logdet_H, logdet_Q);
Calc_Hiy_all(Y, Hi_all, Hiy_all);
Calc_xHi_all(X, Hi_all, xHi_all);
// Calculate QixHiy and yPy.
Calc_xHiy(Y, xHi_all, xHiy);
gsl_blas_dgemv(CblasNoTrans, 1.0, Qi, xHiy, 0.0, QixHiy);
gsl_blas_ddot(QixHiy, xHiy, &yPy);
yPy = Calc_yHiy(Y, Hiy_all) - yPy;
// Calculate log likelihood/restricted likelihood value.
if (func_name == 'R' || func_name == 'r') {
logl_new = logl_const - 0.5 * logdet_H - 0.5 * logdet_Q - 0.5 * yPy;
} else {
logl_new = logl_const - 0.5 * logdet_H - 0.5 * yPy;
}
}
step_scale /= 2.0;
step_iter++;
} while (
(flag_pd == 0 || logl_new < logl_old || logl_new - logl_old > 10) &&
step_iter < 10 && t != 0);
// Terminate if change is small.
if (t != 0) {
if (logl_new < logl_old || flag_pd == 0) {
gsl_matrix_memcpy(V_g, Vg_save);
gsl_matrix_memcpy(V_e, Ve_save);
break;
}
if (logl_new - logl_old < max_prec) {
break;
}
}
logl_old = logl_new;
CalcDev(func_name, eval, Qi, Hi_all, xHi_all, Hiy_all, QixHiy, gradient,
Hessian_inv, crt_a, crt_b, crt_c);
}
// Mutiply Hessian_inv with -1.0.
// Now Hessian_inv is the variance matrix.
gsl_matrix_scale(Hessian_inv, -1.0);
gsl_matrix_free(Vg_save);
gsl_matrix_free(Ve_save);
gsl_matrix_free(V_temp);
gsl_matrix_free(U_temp);
gsl_vector_free(D_temp);
gsl_vector_free(xHiy);
gsl_vector_free(QixHiy);
gsl_matrix_free(Qi);
gsl_matrix_free(XXt);
gsl_vector_free(gradient);
return logl_new;
}
// Initialize Vg, Ve and B.
void MphInitial(const size_t em_iter, const double em_prec,
const size_t nr_iter, const double nr_prec,
const gsl_vector *eval, const gsl_matrix *X,
const gsl_matrix *Y, const double l_min, const double l_max,
const size_t n_region, gsl_matrix *V_g, gsl_matrix *V_e,
gsl_matrix *B) {
debug_msg("MphInitial");
write(Y, "Y in MphInitial");
gsl_matrix_set_zero(V_g);
gsl_matrix_set_zero(V_e);
gsl_matrix_set_zero(B);
size_t n_size = eval->size, c_size = X->size1, d_size = Y->size1;
double a, b, c;
double lambda, logl, vg, ve;
// Initialize the diagonal elements of Vg and Ve using univariate
// LMM and REML estimates.
gsl_matrix *Xt = gsl_matrix_alloc(n_size, c_size);
gsl_vector *beta_temp = gsl_vector_alloc(c_size);
gsl_vector *se_beta_temp = gsl_vector_alloc(c_size);
gsl_matrix_transpose_memcpy(Xt, X);
for (size_t i = 0; i < d_size; i++) {
gsl_vector_const_view Y_row = gsl_matrix_const_row(Y, i);
CalcLambda('R', eval, Xt, &Y_row.vector, l_min, l_max, n_region, lambda,
logl);
CalcLmmVgVeBeta(eval, Xt, &Y_row.vector, lambda, vg, ve, beta_temp,
se_beta_temp);
gsl_matrix_set(V_g, i, i, vg);
gsl_matrix_set(V_e, i, i, ve);
}
gsl_matrix_free(Xt);
gsl_vector_free(beta_temp);
gsl_vector_free(se_beta_temp);
// If number of phenotypes is above four, then obtain the off
// diagonal elements with two trait models.
if (d_size > 4) {
// First obtain good initial values.
// Large matrices for EM.
gsl_matrix *U_hat = gsl_matrix_alloc(2, n_size);
gsl_matrix *E_hat = gsl_matrix_alloc(2, n_size);
gsl_matrix *OmegaU = gsl_matrix_alloc(2, n_size);
gsl_matrix *OmegaE = gsl_matrix_alloc(2, n_size);
gsl_matrix *UltVehiY = gsl_matrix_alloc(2, n_size);
gsl_matrix *UltVehiBX = gsl_matrix_alloc(2, n_size);
gsl_matrix *UltVehiU = gsl_matrix_alloc(2, n_size);
gsl_matrix *UltVehiE = gsl_matrix_alloc(2, n_size);
// Large matrices for NR. Each dxd block is H_k^{-1}.
gsl_matrix *Hi_all = gsl_matrix_alloc(2, 2 * n_size);
// Each column is H_k^{-1}y_k.
gsl_matrix *Hiy_all = gsl_matrix_alloc(2, n_size);
// Each dcxdc block is x_k\otimes H_k^{-1}.
gsl_matrix *xHi_all = gsl_matrix_alloc(2 * c_size, 2 * n_size);
gsl_matrix *Hessian = gsl_matrix_alloc(6, 6);
// 2 by n matrix of Y.
gsl_matrix *Y_sub = gsl_matrix_alloc(2, n_size);
gsl_matrix *Vg_sub = gsl_matrix_alloc(2, 2);
gsl_matrix *Ve_sub = gsl_matrix_alloc(2, 2);
gsl_matrix *B_sub = gsl_matrix_alloc(2, c_size);
for (size_t i = 0; i < d_size; i++) {
gsl_vector_view Y_sub1 = gsl_matrix_row(Y_sub, 0);
gsl_vector_const_view Y_1 = gsl_matrix_const_row(Y, i);
gsl_vector_memcpy(&Y_sub1.vector, &Y_1.vector);
for (size_t j = i + 1; j < d_size; j++) {
gsl_vector_view Y_sub2 = gsl_matrix_row(Y_sub, 1);
gsl_vector_const_view Y_2 = gsl_matrix_const_row(Y, j);
gsl_vector_memcpy(&Y_sub2.vector, &Y_2.vector);
gsl_matrix_set_zero(Vg_sub);
gsl_matrix_set_zero(Ve_sub);
gsl_matrix_set(Vg_sub, 0, 0, gsl_matrix_get(V_g, i, i));
gsl_matrix_set(Ve_sub, 0, 0, gsl_matrix_get(V_e, i, i));
gsl_matrix_set(Vg_sub, 1, 1, gsl_matrix_get(V_g, j, j));
gsl_matrix_set(Ve_sub, 1, 1, gsl_matrix_get(V_e, j, j));
logl = MphEM('R', em_iter, em_prec, eval, X, Y_sub, U_hat, E_hat,
OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU, UltVehiE,
Vg_sub, Ve_sub, B_sub);
logl = MphNR('R', nr_iter, nr_prec, eval, X, Y_sub, Hi_all, xHi_all,
Hiy_all, Vg_sub, Ve_sub, Hessian, a, b, c);
gsl_matrix_set(V_g, i, j, gsl_matrix_get(Vg_sub, 0, 1));
gsl_matrix_set(V_g, j, i, gsl_matrix_get(Vg_sub, 0, 1));
gsl_matrix_set(V_e, i, j, ve = gsl_matrix_get(Ve_sub, 0, 1));
gsl_matrix_set(V_e, j, i, ve = gsl_matrix_get(Ve_sub, 0, 1));
}
}
// Free matrices.
gsl_matrix_free(U_hat);
gsl_matrix_free(E_hat);
gsl_matrix_free(OmegaU);
gsl_matrix_free(OmegaE);
gsl_matrix_free(UltVehiY);
gsl_matrix_free(UltVehiBX);
gsl_matrix_free(UltVehiU);
gsl_matrix_free(UltVehiE);
gsl_matrix_free(Hi_all);
gsl_matrix_free(Hiy_all);
gsl_matrix_free(xHi_all);
gsl_matrix_free(Hessian);
gsl_matrix_free(Y_sub);
gsl_matrix_free(Vg_sub);
gsl_matrix_free(Ve_sub);
gsl_matrix_free(B_sub);
}
// Calculate B hat using GSL estimate.
gsl_matrix *UltVehiY = gsl_matrix_alloc(d_size, n_size);
gsl_vector *D_l = gsl_vector_alloc(d_size);
gsl_matrix *UltVeh = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *UltVehi = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *Qi = gsl_matrix_alloc(d_size * c_size, d_size * c_size);
gsl_vector *XHiy = gsl_vector_alloc(d_size * c_size);
gsl_vector *beta = gsl_vector_alloc(d_size * c_size);
gsl_vector_set_zero(XHiy);
double dl, d, delta, dx, dy;
// Eigen decomposition and calculate log|Ve|.
// double logdet_Ve = EigenProc(V_g, V_e, D_l, UltVeh, UltVehi);
EigenProc(V_g, V_e, D_l, UltVeh, UltVehi);
// Calculate Qi and log|Q|.
// double logdet_Q = CalcQi(eval, D_l, X, Qi);
CalcQi(eval, D_l, X, Qi);
// Calculate UltVehiY.
gsl_blas_dgemm(CblasNoTrans, CblasNoTrans, 1.0, UltVehi, Y, 0.0, UltVehiY);
// calculate XHiy
for (size_t i = 0; i < d_size; i++) {
dl = gsl_vector_get(D_l, i);
for (size_t j = 0; j < c_size; j++) {
d = 0.0;
for (size_t k = 0; k < n_size; k++) {
delta = gsl_vector_get(eval, k);
dx = gsl_matrix_get(X, j, k);
dy = gsl_matrix_get(UltVehiY, i, k);
d += dy * dx / (delta * dl + 1.0);
}
gsl_vector_set(XHiy, j * d_size + i, d);
}
}
gsl_blas_dgemv(CblasNoTrans, 1.0, Qi, XHiy, 0.0, beta);
// Multiply beta by UltVeh and save to B.
for (size_t i = 0; i < c_size; i++) {
gsl_vector_view B_col = gsl_matrix_column(B, i);
gsl_vector_view beta_sub = gsl_vector_subvector(beta, i * d_size, d_size);
gsl_blas_dgemv(CblasTrans, 1.0, UltVeh, &beta_sub.vector, 0.0,
&B_col.vector);
}
// Free memory.
gsl_matrix_free(UltVehiY);
gsl_vector_free(D_l);
gsl_matrix_free(UltVeh);
gsl_matrix_free(UltVehi);
gsl_matrix_free(Qi);
gsl_vector_free(XHiy);
gsl_vector_free(beta);
return;
}
// p-value correction
// mode=1 Wald; mode=2 LRT; mode=3 SCORE;
double PCRT(const size_t mode, const size_t d_size, const double p_value,
const double crt_a, const double crt_b, const double crt_c) {
double p_crt = 0.0, chisq_crt = 0.0, q = (double)d_size;
double chisq = gsl_cdf_chisq_Qinv(p_value, (double)d_size);
if (mode == 1) {
double a = crt_c / (2.0 * q * (q + 2.0));
double b = 1.0 + (crt_a + crt_b) / (2.0 * q);
chisq_crt = (-1.0 * b + safe_sqrt(b * b + 4.0 * a * chisq)) / (2.0 * a);
} else if (mode == 2) {
chisq_crt = chisq / (1.0 + crt_a / (2.0 * q));
} else {
chisq_crt = chisq;
}
p_crt = gsl_cdf_chisq_Q(chisq_crt, (double)d_size);
return p_crt;
}
void MVLMM::AnalyzeBimbam(const gsl_matrix *U, const gsl_vector *eval,
const gsl_matrix *UtW, const gsl_matrix *UtY) {
debug_msg("entering");
write(UtY, "UtY in AnalyzeBimbam");
igzstream infile(file_geno.c_str(), igzstream::in);
if (!infile) {
cout << "error reading genotype file:" << file_geno << endl;
return;
}
clock_t time_start = clock();
time_UtX = 0;
time_opt = 0;
string line;
char *ch_ptr;
double logl_H0 = 0.0, logl_H1 = 0.0, p_wald = 0, p_lrt = 0, p_score = 0;
double crt_a, crt_b, crt_c;
int n_miss, c_phen;
double geno, x_mean;
size_t c = 0;
size_t n_size = UtY->size1, d_size = UtY->size2, c_size = UtW->size2;
size_t dc_size = d_size * (c_size + 1), v_size = d_size * (d_size + 1) / 2;
// Create a large matrix.
size_t msize = LMM_BATCH_SIZE;
gsl_matrix *Xlarge = gsl_matrix_alloc(U->size1, msize);
gsl_matrix *UtXlarge = gsl_matrix_alloc(U->size1, msize);
gsl_matrix_set_zero(Xlarge);
// Large matrices for EM.
gsl_matrix *U_hat = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *E_hat = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *OmegaU = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *OmegaE = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiY = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiBX = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiU = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiE = gsl_matrix_alloc(d_size, n_size);
// Large matrices for NR.
// Each dxd block is H_k^{-1}.
gsl_matrix *Hi_all = gsl_matrix_alloc(d_size, d_size * n_size);
// Each column is H_k^{-1}y_k.
gsl_matrix *Hiy_all = gsl_matrix_alloc(d_size, n_size);
// Each dcxdc block is x_k \otimes H_k^{-1}.
gsl_matrix *xHi_all = gsl_matrix_alloc(dc_size, d_size * n_size);
gsl_matrix *Hessian = gsl_matrix_alloc(v_size * 2, v_size * 2);
gsl_vector *x = gsl_vector_alloc(n_size);
gsl_vector *x_miss = gsl_vector_alloc(n_size);
gsl_matrix *Y = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *X = gsl_matrix_alloc(c_size + 1, n_size);
gsl_matrix *V_g = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *V_e = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *B = gsl_matrix_alloc(d_size, c_size + 1);
gsl_vector *beta = gsl_vector_alloc(d_size);
gsl_matrix *Vbeta = gsl_matrix_alloc(d_size, d_size);
// Null estimates for initial values.
gsl_matrix *V_g_null = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *V_e_null = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *B_null = gsl_matrix_alloc(d_size, c_size + 1);
gsl_matrix *se_B_null = gsl_matrix_alloc(d_size, c_size);
gsl_matrix_view X_sub = gsl_matrix_submatrix(X, 0, 0, c_size, n_size);
gsl_matrix_view B_sub = gsl_matrix_submatrix(B, 0, 0, d_size, c_size);
gsl_matrix_view xHi_all_sub =
gsl_matrix_submatrix(xHi_all, 0, 0, d_size * c_size, d_size * n_size);
gsl_matrix_transpose_memcpy(Y, UtY);
gsl_matrix_transpose_memcpy(&X_sub.matrix, UtW);
gsl_vector_view X_row = gsl_matrix_row(X, c_size);
gsl_vector_set_zero(&X_row.vector);
gsl_vector_view B_col = gsl_matrix_column(B, c_size);
gsl_vector_set_zero(&B_col.vector);
MphInitial(em_iter, em_prec, nr_iter, nr_prec, eval, &X_sub.matrix, Y, l_min,
l_max, n_region, V_g, V_e, &B_sub.matrix);
logl_H0 = MphEM('R', em_iter, em_prec, eval, &X_sub.matrix, Y, U_hat, E_hat,
OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU, UltVehiE, V_g,
V_e, &B_sub.matrix);
logl_H0 = MphNR('R', nr_iter, nr_prec, eval, &X_sub.matrix, Y, Hi_all,
&xHi_all_sub.matrix, Hiy_all, V_g, V_e, Hessian, crt_a, crt_b,
crt_c);
MphCalcBeta(eval, &X_sub.matrix, Y, V_g, V_e, UltVehiY, &B_sub.matrix,
se_B_null);
c = 0;
Vg_remle_null.clear();
Ve_remle_null.clear();
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
Vg_remle_null.push_back(gsl_matrix_get(V_g, i, j));
Ve_remle_null.push_back(gsl_matrix_get(V_e, i, j));
VVg_remle_null.push_back(gsl_matrix_get(Hessian, c, c));
VVe_remle_null.push_back(gsl_matrix_get(Hessian, c + v_size, c + v_size));
c++;
}
}
beta_remle_null.clear();
se_beta_remle_null.clear();
for (size_t i = 0; i < se_B_null->size1; i++) {
for (size_t j = 0; j < se_B_null->size2; j++) {
beta_remle_null.push_back(gsl_matrix_get(B, i, j));
se_beta_remle_null.push_back(gsl_matrix_get(se_B_null, i, j));
}
}
logl_remle_H0 = logl_H0;
cout.setf(std::ios_base::fixed, std::ios_base::floatfield);
cout.precision(4);
cout << "REMLE estimate for Vg in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_g, i, j) << "\t";
}
cout << endl;
}
cout << "se(Vg): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c, c)) << "\t";
}
cout << endl;
}
cout << "REMLE estimate for Ve in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_e, i, j) << "\t";
}
cout << endl;
}
cout << "se(Ve): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c + v_size, c + v_size)) << "\t";
}
cout << endl;
}
cout << "REMLE likelihood = " << logl_H0 << endl;
logl_H0 = MphEM('L', em_iter, em_prec, eval, &X_sub.matrix, Y, U_hat, E_hat,
OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU, UltVehiE, V_g,
V_e, &B_sub.matrix);
logl_H0 = MphNR('L', nr_iter, nr_prec, eval, &X_sub.matrix, Y, Hi_all,
&xHi_all_sub.matrix, Hiy_all, V_g, V_e, Hessian, crt_a, crt_b,
crt_c);
MphCalcBeta(eval, &X_sub.matrix, Y, V_g, V_e, UltVehiY, &B_sub.matrix,
se_B_null);
c = 0;
Vg_mle_null.clear();
Ve_mle_null.clear();
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
Vg_mle_null.push_back(gsl_matrix_get(V_g, i, j));
Ve_mle_null.push_back(gsl_matrix_get(V_e, i, j));
VVg_mle_null.push_back(gsl_matrix_get(Hessian, c, c));
VVe_mle_null.push_back(gsl_matrix_get(Hessian, c + v_size, c + v_size));
c++;
}
}
beta_mle_null.clear();
se_beta_mle_null.clear();
for (size_t i = 0; i < se_B_null->size1; i++) {
for (size_t j = 0; j < se_B_null->size2; j++) {
beta_mle_null.push_back(gsl_matrix_get(B, i, j));
se_beta_mle_null.push_back(gsl_matrix_get(se_B_null, i, j));
}
}
logl_mle_H0 = logl_H0;
cout << "MLE estimate for Vg in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_g, i, j) << "\t";
}
cout << endl;
}
cout << "se(Vg): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c, c)) << "\t";
}
cout << endl;
}
cout << "MLE estimate for Ve in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_e, i, j) << "\t";
}
cout << endl;
}
cout << "se(Ve): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c + v_size, c + v_size)) << "\t";
}
cout << endl;
}
cout << "MLE likelihood = " << logl_H0 << endl;
vector v_beta, v_Vg, v_Ve, v_Vbeta;
for (size_t i = 0; i < d_size; i++) {
v_beta.push_back(0.0);
}
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
v_Vg.push_back(0.0);
v_Ve.push_back(0.0);
v_Vbeta.push_back(0.0);
}
}
gsl_matrix_memcpy(V_g_null, V_g);
gsl_matrix_memcpy(V_e_null, V_e);
gsl_matrix_memcpy(B_null, B);
// Start reading genotypes and analyze.
size_t csnp = 0, t_last = 0;
for (size_t t = 0; t < indicator_snp.size(); ++t) {
if (indicator_snp[t] == 0) {
continue;
}
t_last++;
}
for (size_t t = 0; t < indicator_snp.size(); ++t) {
safeGetline(infile, line).eof();
if (t % d_pace == 0 || t == (ns_total - 1)) {
ProgressBar("Reading SNPs", t, ns_total - 1);
}
if (indicator_snp[t] == 0) {
continue;
}
ch_ptr = strtok_safe((char *)line.c_str(), " , \t");
ch_ptr = strtok_safe(NULL, " , \t");
ch_ptr = strtok_safe(NULL, " , \t");
x_mean = 0.0;
c_phen = 0;
n_miss = 0;
gsl_vector_set_zero(x_miss);
for (size_t i = 0; i < ni_total; ++i) {
ch_ptr = strtok_safe(NULL, " , \t");
if (indicator_idv[i] == 0) {
continue;
}
if (strcmp(ch_ptr, "NA") == 0) {
gsl_vector_set(x_miss, c_phen, 0.0);
n_miss++;
} else {
geno = atof(ch_ptr);
gsl_vector_set(x, c_phen, geno);
gsl_vector_set(x_miss, c_phen, 1.0);
x_mean += geno;
}
c_phen++;
}
x_mean /= (double)(ni_test - n_miss);
for (size_t i = 0; i < ni_test; ++i) {
if (gsl_vector_get(x_miss, i) == 0) {
gsl_vector_set(x, i, x_mean);
}
geno = gsl_vector_get(x, i);
}
gsl_vector_view Xlarge_col = gsl_matrix_column(Xlarge, csnp % msize);
gsl_vector_memcpy(&Xlarge_col.vector, x);
csnp++;
if (csnp % msize == 0 || csnp == t_last) {
size_t l = 0;
if (csnp % msize == 0) {
l = msize;
} else {
l = csnp % msize;
}
gsl_matrix_view Xlarge_sub =
gsl_matrix_submatrix(Xlarge, 0, 0, Xlarge->size1, l);
gsl_matrix_view UtXlarge_sub =
gsl_matrix_submatrix(UtXlarge, 0, 0, UtXlarge->size1, l);
time_start = clock();
fast_dgemm("T", "N", 1.0, U, &Xlarge_sub.matrix, 0.0,
&UtXlarge_sub.matrix);
time_UtX += (clock() - time_start) / (double(CLOCKS_PER_SEC) * 60.0);
gsl_matrix_set_zero(Xlarge);
for (size_t i = 0; i < l; i++) {
gsl_vector_view UtXlarge_col = gsl_matrix_column(UtXlarge, i);
gsl_vector_memcpy(&X_row.vector, &UtXlarge_col.vector);
// Initial values.
gsl_matrix_memcpy(V_g, V_g_null);
gsl_matrix_memcpy(V_e, V_e_null);
gsl_matrix_memcpy(B, B_null);
time_start = clock();
// 3 is before 1.
if (a_mode == 3 || a_mode == 4) {
p_score = MphCalcP(eval, &X_row.vector, &X_sub.matrix, Y, V_g_null,
V_e_null, UltVehiY, beta, Vbeta);
if (p_score < p_nr && crt == 1) {
logl_H1 = MphNR('R', 1, nr_prec * 10, eval, X, Y, Hi_all, xHi_all,
Hiy_all, V_g, V_e, Hessian, crt_a, crt_b, crt_c);
p_score = PCRT(3, d_size, p_score, crt_a, crt_b, crt_c);
}
}
if (a_mode == 2 || a_mode == 4) {
logl_H1 = MphEM('L', em_iter / 10, em_prec * 10, eval, X, Y, U_hat,
E_hat, OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU,
UltVehiE, V_g, V_e, B);
// Calculate beta and Vbeta.
p_lrt = MphCalcP(eval, &X_row.vector, &X_sub.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
p_lrt = gsl_cdf_chisq_Q(2.0 * (logl_H1 - logl_H0), (double)d_size);
if (p_lrt < p_nr) {
logl_H1 =
MphNR('L', nr_iter / 10, nr_prec * 10, eval, X, Y, Hi_all,
xHi_all, Hiy_all, V_g, V_e, Hessian, crt_a, crt_b, crt_c);
// Calculate beta and Vbeta.
p_lrt = MphCalcP(eval, &X_row.vector, &X_sub.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
p_lrt = gsl_cdf_chisq_Q(2.0 * (logl_H1 - logl_H0), (double)d_size);
if (crt == 1) {
p_lrt = PCRT(2, d_size, p_lrt, crt_a, crt_b, crt_c);
}
}
}
if (a_mode == 1 || a_mode == 4) {
logl_H1 = MphEM('R', em_iter / 10, em_prec * 10, eval, X, Y, U_hat,
E_hat, OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU,
UltVehiE, V_g, V_e, B);
p_wald = MphCalcP(eval, &X_row.vector, &X_sub.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
if (p_wald < p_nr) {
logl_H1 =
MphNR('R', nr_iter / 10, nr_prec * 10, eval, X, Y, Hi_all,
xHi_all, Hiy_all, V_g, V_e, Hessian, crt_a, crt_b, crt_c);
p_wald = MphCalcP(eval, &X_row.vector, &X_sub.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
if (crt == 1) {
p_wald = PCRT(1, d_size, p_wald, crt_a, crt_b, crt_c);
}
}
}
time_opt += (clock() - time_start) / (double(CLOCKS_PER_SEC) * 60.0);
// Store summary data.
for (size_t i = 0; i < d_size; i++) {
v_beta[i] = gsl_vector_get(beta, i);
}
c = 0;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
v_Vg[c] = gsl_matrix_get(V_g, i, j);
v_Ve[c] = gsl_matrix_get(V_e, i, j);
v_Vbeta[c] = gsl_matrix_get(Vbeta, i, j);
c++;
}
}
MPHSUMSTAT SNPs = {v_beta, p_wald, p_lrt, p_score, v_Vg, v_Ve, v_Vbeta};
sumStat.push_back(SNPs);
}
}
}
cout << endl;
infile.close();
infile.clear();
gsl_matrix_free(U_hat);
gsl_matrix_free(E_hat);
gsl_matrix_free(OmegaU);
gsl_matrix_free(OmegaE);
gsl_matrix_free(UltVehiY);
gsl_matrix_free(UltVehiBX);
gsl_matrix_free(UltVehiU);
gsl_matrix_free(UltVehiE);
gsl_matrix_free(Hi_all);
gsl_matrix_free(Hiy_all);
gsl_matrix_free(xHi_all);
gsl_matrix_free(Hessian);
gsl_vector_free(x);
gsl_vector_free(x_miss);
gsl_matrix_free(Y);
gsl_matrix_free(X);
gsl_matrix_free(V_g);
gsl_matrix_free(V_e);
gsl_matrix_free(B);
gsl_vector_free(beta);
gsl_matrix_free(Vbeta);
gsl_matrix_free(V_g_null);
gsl_matrix_free(V_e_null);
gsl_matrix_free(B_null);
gsl_matrix_free(se_B_null);
gsl_matrix_free(Xlarge);
gsl_matrix_free(UtXlarge);
return;
}
void MVLMM::AnalyzePlink(const gsl_matrix *U, const gsl_vector *eval,
const gsl_matrix *UtW, const gsl_matrix *UtY) {
debug_msg("entering");
string file_bed = file_bfile + ".bed";
ifstream infile(file_bed.c_str(), ios::binary);
if (!infile) {
cout << "error reading bed file:" << file_bed << endl;
return;
}
clock_t time_start = clock();
time_UtX = 0;
time_opt = 0;
char ch[1];
bitset<8> b;
double logl_H0 = 0.0, logl_H1 = 0.0, p_wald = 0, p_lrt = 0, p_score = 0;
double crt_a, crt_b, crt_c;
int n_bit, n_miss, ci_total, ci_test;
double geno, x_mean;
size_t c = 0;
size_t n_size = UtY->size1, d_size = UtY->size2, c_size = UtW->size2;
size_t dc_size = d_size * (c_size + 1), v_size = d_size * (d_size + 1) / 2;
// Create a large matrix.
size_t msize = LMM_BATCH_SIZE;
gsl_matrix *Xlarge = gsl_matrix_alloc(U->size1, msize);
gsl_matrix *UtXlarge = gsl_matrix_alloc(U->size1, msize);
gsl_matrix_set_zero(Xlarge);
// Large matrices for EM.
gsl_matrix *U_hat = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *E_hat = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *OmegaU = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *OmegaE = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiY = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiBX = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiU = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiE = gsl_matrix_alloc(d_size, n_size);
// Large matrices for NR.
// Each dxd block is H_k^{-1}.
gsl_matrix *Hi_all = gsl_matrix_alloc(d_size, d_size * n_size);
// Each column is H_k^{-1}y_k.
gsl_matrix *Hiy_all = gsl_matrix_alloc(d_size, n_size);
// Each dcxdc block is x_k\otimes H_k^{-1}.
gsl_matrix *xHi_all = gsl_matrix_alloc(dc_size, d_size * n_size);
gsl_matrix *Hessian = gsl_matrix_alloc(v_size * 2, v_size * 2);
gsl_vector *x = gsl_vector_alloc(n_size);
gsl_matrix *Y = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *X = gsl_matrix_alloc(c_size + 1, n_size);
gsl_matrix *V_g = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *V_e = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *B = gsl_matrix_alloc(d_size, c_size + 1);
gsl_vector *beta = gsl_vector_alloc(d_size);
gsl_matrix *Vbeta = gsl_matrix_alloc(d_size, d_size);
// Null estimates for initial values.
gsl_matrix *V_g_null = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *V_e_null = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *B_null = gsl_matrix_alloc(d_size, c_size + 1);
gsl_matrix *se_B_null = gsl_matrix_alloc(d_size, c_size);
gsl_matrix_view X_sub = gsl_matrix_submatrix(X, 0, 0, c_size, n_size);
gsl_matrix_view B_sub = gsl_matrix_submatrix(B, 0, 0, d_size, c_size);
gsl_matrix_view xHi_all_sub =
gsl_matrix_submatrix(xHi_all, 0, 0, d_size * c_size, d_size * n_size);
gsl_matrix_transpose_memcpy(Y, UtY);
gsl_matrix_transpose_memcpy(&X_sub.matrix, UtW);
gsl_vector_view X_row = gsl_matrix_row(X, c_size);
gsl_vector_set_zero(&X_row.vector);
gsl_vector_view B_col = gsl_matrix_column(B, c_size);
gsl_vector_set_zero(&B_col.vector);
MphInitial(em_iter, em_prec, nr_iter, nr_prec, eval, &X_sub.matrix, Y, l_min,
l_max, n_region, V_g, V_e, &B_sub.matrix);
write(eval,"eval4");
logl_H0 = MphEM('R', em_iter, em_prec, eval, &X_sub.matrix, Y, U_hat, E_hat,
OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU, UltVehiE, V_g,
V_e, &B_sub.matrix);
logl_H0 = MphNR('R', nr_iter, nr_prec, eval, &X_sub.matrix, Y, Hi_all,
&xHi_all_sub.matrix, Hiy_all, V_g, V_e, Hessian, crt_a, crt_b,
crt_c);
MphCalcBeta(eval, &X_sub.matrix, Y, V_g, V_e, UltVehiY, &B_sub.matrix,
se_B_null);
c = 0;
Vg_remle_null.clear();
Ve_remle_null.clear();
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
Vg_remle_null.push_back(gsl_matrix_get(V_g, i, j));
Ve_remle_null.push_back(gsl_matrix_get(V_e, i, j));
VVg_remle_null.push_back(gsl_matrix_get(Hessian, c, c));
VVe_remle_null.push_back(gsl_matrix_get(Hessian, c + v_size, c + v_size));
c++;
}
}
beta_remle_null.clear();
se_beta_remle_null.clear();
for (size_t i = 0; i < se_B_null->size1; i++) {
for (size_t j = 0; j < se_B_null->size2; j++) {
beta_remle_null.push_back(gsl_matrix_get(B, i, j));
se_beta_remle_null.push_back(gsl_matrix_get(se_B_null, i, j));
}
}
logl_remle_H0 = logl_H0;
cout.setf(std::ios_base::fixed, std::ios_base::floatfield);
cout.precision(4);
cout << "REMLE estimate for Vg in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_g, i, j) << "\t";
}
cout << endl;
}
cout << "se(Vg): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c, c)) << "\t";
}
cout << endl;
}
cout << "REMLE estimate for Ve in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_e, i, j) << "\t";
}
cout << endl;
}
cout << "se(Ve): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
auto v = gsl_matrix_get(Hessian, c + v_size, c + v_size);
if (is_strict_mode())
enforce_msg(v >= 0,"se(Ve) is not valid");
cout << safe_sqrt(v) << "\t";
}
cout << endl;
}
cout << "REMLE likelihood = " << logl_H0 << endl;
logl_H0 = MphEM('L', em_iter, em_prec, eval, &X_sub.matrix, Y, U_hat, E_hat,
OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU, UltVehiE, V_g,
V_e, &B_sub.matrix);
logl_H0 = MphNR('L', nr_iter, nr_prec, eval, &X_sub.matrix, Y, Hi_all,
&xHi_all_sub.matrix, Hiy_all, V_g, V_e, Hessian, crt_a, crt_b,
crt_c);
MphCalcBeta(eval, &X_sub.matrix, Y, V_g, V_e, UltVehiY, &B_sub.matrix,
se_B_null);
c = 0;
Vg_mle_null.clear();
Ve_mle_null.clear();
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
Vg_mle_null.push_back(gsl_matrix_get(V_g, i, j));
Ve_mle_null.push_back(gsl_matrix_get(V_e, i, j));
VVg_mle_null.push_back(gsl_matrix_get(Hessian, c, c));
VVe_mle_null.push_back(gsl_matrix_get(Hessian, c + v_size, c + v_size));
c++;
}
}
beta_mle_null.clear();
se_beta_mle_null.clear();
for (size_t i = 0; i < se_B_null->size1; i++) {
for (size_t j = 0; j < se_B_null->size2; j++) {
beta_mle_null.push_back(gsl_matrix_get(B, i, j));
se_beta_mle_null.push_back(gsl_matrix_get(se_B_null, i, j));
}
}
logl_mle_H0 = logl_H0;
cout << "MLE estimate for Vg in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_g, i, j) << "\t";
}
cout << endl;
}
cout << "se(Vg): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c, c)) << "\t";
}
cout << endl;
}
cout << "MLE estimate for Ve in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_e, i, j) << "\t";
}
cout << endl;
}
cout << "se(Ve): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
auto v = gsl_matrix_get(Hessian, c + v_size, c + v_size);
if (is_strict_mode())
enforce_msg(v >= 0,"se(Ve) is not valid");
cout << safe_sqrt(v) << "\t";
}
cout << endl;
}
cout << "MLE likelihood = " << logl_H0 << endl;
vector v_beta, v_Vg, v_Ve, v_Vbeta;
for (size_t i = 0; i < d_size; i++) {
v_beta.push_back(0.0);
}
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
v_Vg.push_back(0.0);
v_Ve.push_back(0.0);
v_Vbeta.push_back(0.0);
}
}
gsl_matrix_memcpy(V_g_null, V_g);
gsl_matrix_memcpy(V_e_null, V_e);
gsl_matrix_memcpy(B_null, B);
// Start reading genotypes and analyze.
// Calculate n_bit and c, the number of bit for each snp.
if (ni_total % 4 == 0) {
n_bit = ni_total / 4;
} else {
n_bit = ni_total / 4 + 1;
}
// Print the first three magic numbers.
for (int i = 0; i < 3; ++i) {
infile.read(ch, 1);
b = ch[0];
}
size_t csnp = 0, t_last = 0;
for (size_t t = 0; t < indicator_snp.size(); ++t) {
if (indicator_snp[t] == 0) {
continue;
}
t_last++;
}
for (vector::size_type t = 0; t < snpInfo.size(); ++t) {
// cout << snpInfo[t].rs_number << endl;
if (t % d_pace == 0 || t == snpInfo.size() - 1) {
ProgressBar("Reading SNPs", t, snpInfo.size() - 1);
}
if (indicator_snp[t] == 0) {
continue;
}
// n_bit, and 3 is the number of magic numbers.
infile.seekg(t * n_bit + 3);
// read genotypes
x_mean = 0.0;
n_miss = 0;
ci_total = 0;
ci_test = 0;
for (int i = 0; i < n_bit; ++i) {
infile.read(ch, 1);
b = ch[0];
// Minor allele homozygous: 2.0; major: 0.0;
for (size_t j = 0; j < 4; ++j) {
if ((i == (n_bit - 1)) && ci_total == (int)ni_total) {
break;
}
if (indicator_idv[ci_total] == 0) {
ci_total++;
continue;
}
if (b[2 * j] == 0) {
if (b[2 * j + 1] == 0) {
gsl_vector_set(x, ci_test, 2);
x_mean += 2.0;
} else {
gsl_vector_set(x, ci_test, 1);
x_mean += 1.0;
}
} else {
if (b[2 * j + 1] == 1) {
gsl_vector_set(x, ci_test, 0);
} else {
gsl_vector_set(x, ci_test, -9);
n_miss++;
}
}
ci_total++;
ci_test++;
}
}
x_mean /= (double)(ni_test - n_miss);
for (size_t i = 0; i < ni_test; ++i) {
geno = gsl_vector_get(x, i);
if (geno == -9) {
gsl_vector_set(x, i, x_mean);
geno = x_mean;
}
}
gsl_vector_view Xlarge_col = gsl_matrix_column(Xlarge, csnp % msize);
gsl_vector_memcpy(&Xlarge_col.vector, x);
csnp++;
if (csnp % msize == 0 || csnp == t_last) {
size_t l = 0;
if (csnp % msize == 0) {
l = msize;
} else {
l = csnp % msize;
}
gsl_matrix_view Xlarge_sub =
gsl_matrix_submatrix(Xlarge, 0, 0, Xlarge->size1, l);
gsl_matrix_view UtXlarge_sub =
gsl_matrix_submatrix(UtXlarge, 0, 0, UtXlarge->size1, l);
time_start = clock();
fast_dgemm("T", "N", 1.0, U, &Xlarge_sub.matrix, 0.0,
&UtXlarge_sub.matrix);
time_UtX += (clock() - time_start) / (double(CLOCKS_PER_SEC) * 60.0);
gsl_matrix_set_zero(Xlarge);
for (size_t i = 0; i < l; i++) {
// double t = (double(clock()-time_start)/(double(CLOCKS_PER_SEC)));
// printf("%.2f ",t);
// if (i>10) exit(1);
// cout << i << "," << l << endl;
gsl_vector_view UtXlarge_col = gsl_matrix_column(UtXlarge, i);
gsl_vector_memcpy(&X_row.vector, &UtXlarge_col.vector);
// Initial values.
gsl_matrix_memcpy(V_g, V_g_null);
gsl_matrix_memcpy(V_e, V_e_null);
gsl_matrix_memcpy(B, B_null);
time_start = clock();
// 3 is before 1.
if (a_mode == 3 || a_mode == 4) {
p_score = MphCalcP(eval, &X_row.vector, &X_sub.matrix, Y, V_g_null,
V_e_null, UltVehiY, beta, Vbeta);
if (p_score < p_nr && crt == 1) {
logl_H1 = MphNR('R', 1, nr_prec * 10, eval, X, Y, Hi_all, xHi_all,
Hiy_all, V_g, V_e, Hessian, crt_a, crt_b, crt_c);
p_score = PCRT(3, d_size, p_score, crt_a, crt_b, crt_c);
}
}
if (a_mode == 2 || a_mode == 4) {
logl_H1 = MphEM('L', em_iter / 10, em_prec * 10, eval, X, Y, U_hat,
E_hat, OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU,
UltVehiE, V_g, V_e, B);
// Calculate beta and Vbeta.
p_lrt = MphCalcP(eval, &X_row.vector, &X_sub.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
p_lrt = gsl_cdf_chisq_Q(2.0 * (logl_H1 - logl_H0), (double)d_size);
if (p_lrt < p_nr) {
logl_H1 =
MphNR('L', nr_iter / 10, nr_prec * 10, eval, X, Y, Hi_all,
xHi_all, Hiy_all, V_g, V_e, Hessian, crt_a, crt_b, crt_c);
// Calculate beta and Vbeta.
p_lrt = MphCalcP(eval, &X_row.vector, &X_sub.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
p_lrt = gsl_cdf_chisq_Q(2.0 * (logl_H1 - logl_H0), (double)d_size);
if (crt == 1) {
p_lrt = PCRT(2, d_size, p_lrt, crt_a, crt_b, crt_c);
}
}
}
if (a_mode == 1 || a_mode == 4) {
logl_H1 = MphEM('R', em_iter / 10, em_prec * 10, eval, X, Y, U_hat,
E_hat, OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU,
UltVehiE, V_g, V_e, B);
p_wald = MphCalcP(eval, &X_row.vector, &X_sub.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
if (p_wald < p_nr) {
logl_H1 =
MphNR('R', nr_iter / 10, nr_prec * 10, eval, X, Y, Hi_all,
xHi_all, Hiy_all, V_g, V_e, Hessian, crt_a, crt_b, crt_c);
p_wald = MphCalcP(eval, &X_row.vector, &X_sub.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
if (crt == 1) {
p_wald = PCRT(1, d_size, p_wald, crt_a, crt_b, crt_c);
}
}
}
time_opt += (clock() - time_start) / (double(CLOCKS_PER_SEC) * 60.0);
// Store summary data.
for (size_t i = 0; i < d_size; i++) {
v_beta[i] = gsl_vector_get(beta, i);
}
c = 0;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
v_Vg[c] = gsl_matrix_get(V_g, i, j);
v_Ve[c] = gsl_matrix_get(V_e, i, j);
v_Vbeta[c] = gsl_matrix_get(Vbeta, i, j);
c++;
}
}
MPHSUMSTAT SNPs = {v_beta, p_wald, p_lrt, p_score, v_Vg, v_Ve, v_Vbeta};
sumStat.push_back(SNPs);
}
}
}
cout << endl;
infile.close();
infile.clear();
gsl_matrix_free(U_hat);
gsl_matrix_free(E_hat);
gsl_matrix_free(OmegaU);
gsl_matrix_free(OmegaE);
gsl_matrix_free(UltVehiY);
gsl_matrix_free(UltVehiBX);
gsl_matrix_free(UltVehiU);
gsl_matrix_free(UltVehiE);
gsl_matrix_free(Hi_all);
gsl_matrix_free(Hiy_all);
gsl_matrix_free(xHi_all);
gsl_matrix_free(Hessian);
gsl_vector_free(x);
gsl_matrix_free(Y);
gsl_matrix_free(X);
gsl_matrix_free(V_g);
gsl_matrix_free(V_e);
gsl_matrix_free(B);
gsl_vector_free(beta);
gsl_matrix_free(Vbeta);
gsl_matrix_free(V_g_null);
gsl_matrix_free(V_e_null);
gsl_matrix_free(B_null);
gsl_matrix_free(se_B_null);
gsl_matrix_free(Xlarge);
gsl_matrix_free(UtXlarge);
return;
}
// Calculate Vg, Ve, B, se(B) in the null mvLMM model.
// Both B and se_B are d by c matrices.
void CalcMvLmmVgVeBeta(const gsl_vector *eval, const gsl_matrix *UtW,
const gsl_matrix *UtY, const size_t em_iter,
const size_t nr_iter, const double em_prec,
const double nr_prec, const double l_min,
const double l_max, const size_t n_region,
gsl_matrix *V_g, gsl_matrix *V_e, gsl_matrix *B,
gsl_matrix *se_B) {
size_t n_size = UtY->size1, d_size = UtY->size2, c_size = UtW->size2;
size_t dc_size = d_size * c_size, v_size = d_size * (d_size + 1) / 2;
double crt_a, crt_b, crt_c;
// Large matrices for EM.
gsl_matrix *U_hat = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *E_hat = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *OmegaU = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *OmegaE = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiY = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiBX = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiU = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiE = gsl_matrix_alloc(d_size, n_size);
// Large matrices for NR.
// Each dxd block is H_k^{-1}.
gsl_matrix *Hi_all = gsl_matrix_alloc(d_size, d_size * n_size);
// Each column is H_k^{-1}y_k.
gsl_matrix *Hiy_all = gsl_matrix_alloc(d_size, n_size);
// Each dcxdc block is x_k\otimes H_k^{-1}.
gsl_matrix *xHi_all = gsl_matrix_alloc(dc_size, d_size * n_size);
gsl_matrix *Hessian = gsl_matrix_alloc(v_size * 2, v_size * 2);
// Transpose matrices.
gsl_matrix *Y = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *W = gsl_matrix_alloc(c_size, n_size);
gsl_matrix_transpose_memcpy(Y, UtY);
gsl_matrix_transpose_memcpy(W, UtW);
// Initial, EM, NR, and calculate B.
MphInitial(em_iter, em_prec, nr_iter, nr_prec, eval, W, Y, l_min, l_max,
n_region, V_g, V_e, B);
MphEM('R', em_iter, em_prec, eval, W, Y, U_hat, E_hat, OmegaU, OmegaE,
UltVehiY, UltVehiBX, UltVehiU, UltVehiE, V_g, V_e, B);
MphNR('R', nr_iter, nr_prec, eval, W, Y, Hi_all, xHi_all, Hiy_all, V_g,
V_e, Hessian, crt_a, crt_b, crt_c);
MphCalcBeta(eval, W, Y, V_g, V_e, UltVehiY, B, se_B);
// Free matrices.
gsl_matrix_free(U_hat);
gsl_matrix_free(E_hat);
gsl_matrix_free(OmegaU);
gsl_matrix_free(OmegaE);
gsl_matrix_free(UltVehiY);
gsl_matrix_free(UltVehiBX);
gsl_matrix_free(UltVehiU);
gsl_matrix_free(UltVehiE);
gsl_matrix_free(Hi_all);
gsl_matrix_free(Hiy_all);
gsl_matrix_free(xHi_all);
gsl_matrix_free(Hessian);
gsl_matrix_free(Y);
gsl_matrix_free(W);
return;
}
void MVLMM::AnalyzeBimbamGXE(const gsl_matrix *U, const gsl_vector *eval,
const gsl_matrix *UtW, const gsl_matrix *UtY,
const gsl_vector *env) {
debug_msg("entering");
igzstream infile(file_geno.c_str(), igzstream::in);
if (!infile) {
cout << "error reading genotype file:" << file_geno << endl;
return;
}
clock_t time_start = clock();
time_UtX = 0;
time_opt = 0;
string line;
char *ch_ptr;
double logl_H0 = 0.0, logl_H1 = 0.0, p_wald = 0, p_lrt = 0, p_score = 0;
double crt_a, crt_b, crt_c;
int n_miss, c_phen;
double geno, x_mean;
size_t c = 0;
size_t n_size = UtY->size1, d_size = UtY->size2, c_size = UtW->size2 + 2;
size_t dc_size = d_size * (c_size + 1), v_size = d_size * (d_size + 1) / 2;
// Large matrices for EM.
gsl_matrix *U_hat = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *E_hat = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *OmegaU = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *OmegaE = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiY = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiBX = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiU = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiE = gsl_matrix_alloc(d_size, n_size);
// Large matrices for NR.
// Each dxd block is H_k^{-1}.
gsl_matrix *Hi_all = gsl_matrix_alloc(d_size, d_size * n_size);
// Each column is H_k^{-1}y_k.
gsl_matrix *Hiy_all = gsl_matrix_alloc(d_size, n_size);
// Each dcxdc block is x_k\otimes H_k^{-1}.
gsl_matrix *xHi_all = gsl_matrix_alloc(dc_size, d_size * n_size);
gsl_matrix *Hessian = gsl_matrix_alloc(v_size * 2, v_size * 2);
gsl_vector *x = gsl_vector_alloc(n_size);
gsl_vector *x_miss = gsl_vector_alloc(n_size);
gsl_matrix *Y = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *X = gsl_matrix_alloc(c_size + 1, n_size);
gsl_matrix *V_g = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *V_e = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *B = gsl_matrix_alloc(d_size, c_size + 1);
gsl_vector *beta = gsl_vector_alloc(d_size);
gsl_matrix *Vbeta = gsl_matrix_alloc(d_size, d_size);
// Null estimates for initial values; including env but not
// including x.
gsl_matrix *V_g_null = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *V_e_null = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *B_null = gsl_matrix_alloc(d_size, c_size + 1);
gsl_matrix *se_B_null1 = gsl_matrix_alloc(d_size, c_size - 1);
gsl_matrix *se_B_null2 = gsl_matrix_alloc(d_size, c_size);
gsl_matrix_view X_sub1 = gsl_matrix_submatrix(X, 0, 0, c_size - 1, n_size);
gsl_matrix_view B_sub1 = gsl_matrix_submatrix(B, 0, 0, d_size, c_size - 1);
gsl_matrix_view xHi_all_sub1 = gsl_matrix_submatrix(
xHi_all, 0, 0, d_size * (c_size - 1), d_size * n_size);
gsl_matrix_view X_sub2 = gsl_matrix_submatrix(X, 0, 0, c_size, n_size);
gsl_matrix_view B_sub2 = gsl_matrix_submatrix(B, 0, 0, d_size, c_size);
gsl_matrix_view xHi_all_sub2 =
gsl_matrix_submatrix(xHi_all, 0, 0, d_size * c_size, d_size * n_size);
gsl_matrix_transpose_memcpy(Y, UtY);
gsl_matrix_view X_sub0 = gsl_matrix_submatrix(X, 0, 0, c_size - 2, n_size);
gsl_matrix_transpose_memcpy(&X_sub0.matrix, UtW);
gsl_vector_view X_row0 = gsl_matrix_row(X, c_size - 2);
gsl_blas_dgemv(CblasTrans, 1.0, U, env, 0.0, &X_row0.vector);
gsl_vector_view X_row1 = gsl_matrix_row(X, c_size - 1);
gsl_vector_set_zero(&X_row1.vector);
gsl_vector_view X_row2 = gsl_matrix_row(X, c_size);
gsl_vector_set_zero(&X_row2.vector);
gsl_vector_view B_col1 = gsl_matrix_column(B, c_size - 1);
gsl_vector_set_zero(&B_col1.vector);
gsl_vector_view B_col2 = gsl_matrix_column(B, c_size);
gsl_vector_set_zero(&B_col2.vector);
MphInitial(em_iter, em_prec, nr_iter, nr_prec, eval, &X_sub1.matrix, Y, l_min,
l_max, n_region, V_g, V_e, &B_sub1.matrix);
logl_H0 = MphEM('R', em_iter, em_prec, eval, &X_sub1.matrix, Y, U_hat, E_hat,
OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU, UltVehiE, V_g,
V_e, &B_sub1.matrix);
logl_H0 = MphNR('R', nr_iter, nr_prec, eval, &X_sub1.matrix, Y, Hi_all,
&xHi_all_sub1.matrix, Hiy_all, V_g, V_e, Hessian, crt_a,
crt_b, crt_c);
MphCalcBeta(eval, &X_sub1.matrix, Y, V_g, V_e, UltVehiY, &B_sub1.matrix,
se_B_null1);
c = 0;
Vg_remle_null.clear();
Ve_remle_null.clear();
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
Vg_remle_null.push_back(gsl_matrix_get(V_g, i, j));
Ve_remle_null.push_back(gsl_matrix_get(V_e, i, j));
VVg_remle_null.push_back(gsl_matrix_get(Hessian, c, c));
VVe_remle_null.push_back(gsl_matrix_get(Hessian, c + v_size, c + v_size));
c++;
}
}
beta_remle_null.clear();
se_beta_remle_null.clear();
for (size_t i = 0; i < se_B_null1->size1; i++) {
for (size_t j = 0; j < se_B_null1->size2; j++) {
beta_remle_null.push_back(gsl_matrix_get(B, i, j));
se_beta_remle_null.push_back(gsl_matrix_get(se_B_null1, i, j));
}
}
logl_remle_H0 = logl_H0;
cout.setf(std::ios_base::fixed, std::ios_base::floatfield);
cout.precision(4);
cout << "REMLE estimate for Vg in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_g, i, j) << "\t";
}
cout << endl;
}
cout << "se(Vg): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c, c)) << "\t";
}
cout << endl;
}
cout << "REMLE estimate for Ve in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_e, i, j) << "\t";
}
cout << endl;
}
cout << "se(Ve): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c + v_size, c + v_size)) << "\t";
}
cout << endl;
}
cout << "REMLE likelihood = " << logl_H0 << endl;
logl_H0 = MphEM('L', em_iter, em_prec, eval, &X_sub1.matrix, Y, U_hat, E_hat,
OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU, UltVehiE, V_g,
V_e, &B_sub1.matrix);
logl_H0 = MphNR('L', nr_iter, nr_prec, eval, &X_sub1.matrix, Y, Hi_all,
&xHi_all_sub1.matrix, Hiy_all, V_g, V_e, Hessian, crt_a,
crt_b, crt_c);
MphCalcBeta(eval, &X_sub1.matrix, Y, V_g, V_e, UltVehiY, &B_sub1.matrix,
se_B_null1);
c = 0;
Vg_mle_null.clear();
Ve_mle_null.clear();
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
Vg_mle_null.push_back(gsl_matrix_get(V_g, i, j));
Ve_mle_null.push_back(gsl_matrix_get(V_e, i, j));
VVg_mle_null.push_back(gsl_matrix_get(Hessian, c, c));
VVe_mle_null.push_back(gsl_matrix_get(Hessian, c + v_size, c + v_size));
c++;
}
}
beta_mle_null.clear();
se_beta_mle_null.clear();
for (size_t i = 0; i < se_B_null1->size1; i++) {
for (size_t j = 0; j < se_B_null1->size2; j++) {
beta_mle_null.push_back(gsl_matrix_get(B, i, j));
se_beta_mle_null.push_back(gsl_matrix_get(se_B_null1, i, j));
}
}
logl_mle_H0 = logl_H0;
cout << "MLE estimate for Vg in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_g, i, j) << "\t";
}
cout << endl;
}
cout << "se(Vg): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c, c)) << "\t";
}
cout << endl;
}
cout << "MLE estimate for Ve in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_e, i, j) << "\t";
}
cout << endl;
}
cout << "se(Ve): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c + v_size, c + v_size)) << "\t";
}
cout << endl;
}
cout << "MLE likelihood = " << logl_H0 << endl;
vector v_beta, v_Vg, v_Ve, v_Vbeta;
for (size_t i = 0; i < d_size; i++) {
v_beta.push_back(0.0);
}
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
v_Vg.push_back(0.0);
v_Ve.push_back(0.0);
v_Vbeta.push_back(0.0);
}
}
gsl_matrix_memcpy(V_g_null, V_g);
gsl_matrix_memcpy(V_e_null, V_e);
gsl_matrix_memcpy(B_null, B);
// Start reading genotypes and analyze.
for (size_t t = 0; t < indicator_snp.size(); ++t) {
safeGetline(infile, line).eof();
if (t % d_pace == 0 || t == (ns_total - 1)) {
ProgressBar("Reading SNPs", t, ns_total - 1);
}
if (indicator_snp[t] == 0) {
continue;
}
ch_ptr = strtok_safe((char *)line.c_str(), " , \t");
ch_ptr = strtok_safe(NULL, " , \t");
ch_ptr = strtok_safe(NULL, " , \t");
x_mean = 0.0;
c_phen = 0;
n_miss = 0;
gsl_vector_set_zero(x_miss);
for (size_t i = 0; i < ni_total; ++i) {
ch_ptr = strtok_safe(NULL, " , \t");
if (indicator_idv[i] == 0) {
continue;
}
if (strcmp(ch_ptr, "NA") == 0) {
gsl_vector_set(x_miss, c_phen, 0.0);
n_miss++;
} else {
geno = atof(ch_ptr);
gsl_vector_set(x, c_phen, geno);
gsl_vector_set(x_miss, c_phen, 1.0);
x_mean += geno;
}
c_phen++;
}
x_mean /= (double)(ni_test - n_miss);
for (size_t i = 0; i < ni_test; ++i) {
if (gsl_vector_get(x_miss, i) == 0) {
gsl_vector_set(x, i, x_mean);
}
geno = gsl_vector_get(x, i);
if (x_mean > 1) {
gsl_vector_set(x, i, 2 - geno);
}
}
// Calculate statistics.
time_start = clock();
gsl_blas_dgemv(CblasTrans, 1.0, U, x, 0.0, &X_row1.vector);
gsl_vector_mul(x, env);
gsl_blas_dgemv(CblasTrans, 1.0, U, x, 0.0, &X_row2.vector);
time_UtX += (clock() - time_start) / (double(CLOCKS_PER_SEC) * 60.0);
// initial values
gsl_matrix_memcpy(V_g, V_g_null);
gsl_matrix_memcpy(V_e, V_e_null);
gsl_matrix_memcpy(B, B_null);
if (a_mode == 2 || a_mode == 3 || a_mode == 4) {
if (a_mode == 3 || a_mode == 4) {
logl_H0 = MphEM('R', em_iter / 10, em_prec * 10, eval, &X_sub2.matrix,
Y, U_hat, E_hat, OmegaU, OmegaE, UltVehiY, UltVehiBX,
UltVehiU, UltVehiE, V_g, V_e, &B_sub2.matrix);
logl_H0 = MphNR('R', nr_iter / 10, nr_prec * 10, eval, &X_sub2.matrix,
Y, Hi_all, &xHi_all_sub2.matrix, Hiy_all, V_g, V_e,
Hessian, crt_a, crt_b, crt_c);
MphCalcBeta(eval, &X_sub2.matrix, Y, V_g, V_e, UltVehiY, &B_sub2.matrix,
se_B_null2);
}
if (a_mode == 2 || a_mode == 4) {
logl_H0 = MphEM('L', em_iter / 10, em_prec * 10, eval, &X_sub2.matrix,
Y, U_hat, E_hat, OmegaU, OmegaE, UltVehiY, UltVehiBX,
UltVehiU, UltVehiE, V_g, V_e, &B_sub2.matrix);
logl_H0 = MphNR('L', nr_iter / 10, nr_prec * 10, eval, &X_sub2.matrix,
Y, Hi_all, &xHi_all_sub2.matrix, Hiy_all, V_g, V_e,
Hessian, crt_a, crt_b, crt_c);
MphCalcBeta(eval, &X_sub2.matrix, Y, V_g, V_e, UltVehiY, &B_sub2.matrix,
se_B_null2);
}
}
time_start = clock();
// 3 is before 1.
if (a_mode == 3 || a_mode == 4) {
p_score = MphCalcP(eval, &X_row2.vector, &X_sub2.matrix, Y, V_g_null,
V_e_null, UltVehiY, beta, Vbeta);
if (p_score < p_nr && crt == 1) {
logl_H1 = MphNR('R', 1, nr_prec * 10, eval, X, Y, Hi_all, xHi_all,
Hiy_all, V_g, V_e, Hessian, crt_a, crt_b, crt_c);
p_score = PCRT(3, d_size, p_score, crt_a, crt_b, crt_c);
}
}
if (a_mode == 2 || a_mode == 4) {
logl_H1 = MphEM('L', em_iter / 10, em_prec * 10, eval, X, Y, U_hat, E_hat,
OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU, UltVehiE,
V_g, V_e, B);
// Calculate beta and Vbeta.
p_lrt = MphCalcP(eval, &X_row2.vector, &X_sub2.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
p_lrt = gsl_cdf_chisq_Q(2.0 * (logl_H1 - logl_H0), (double)d_size);
if (p_lrt < p_nr) {
logl_H1 =
MphNR('L', nr_iter / 10, nr_prec * 10, eval, X, Y, Hi_all, xHi_all,
Hiy_all, V_g, V_e, Hessian, crt_a, crt_b, crt_c);
// Calculate beta and Vbeta.
p_lrt = MphCalcP(eval, &X_row2.vector, &X_sub2.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
p_lrt = gsl_cdf_chisq_Q(2.0 * (logl_H1 - logl_H0), (double)d_size);
if (crt == 1) {
p_lrt = PCRT(2, d_size, p_lrt, crt_a, crt_b, crt_c);
}
}
}
if (a_mode == 1 || a_mode == 4) {
logl_H1 = MphEM('R', em_iter / 10, em_prec * 10, eval, X, Y, U_hat, E_hat,
OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU, UltVehiE,
V_g, V_e, B);
p_wald = MphCalcP(eval, &X_row2.vector, &X_sub2.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
if (p_wald < p_nr) {
logl_H1 =
MphNR('R', nr_iter / 10, nr_prec * 10, eval, X, Y, Hi_all, xHi_all,
Hiy_all, V_g, V_e, Hessian, crt_a, crt_b, crt_c);
p_wald = MphCalcP(eval, &X_row2.vector, &X_sub2.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
if (crt == 1) {
p_wald = PCRT(1, d_size, p_wald, crt_a, crt_b, crt_c);
}
}
}
if (x_mean > 1) {
gsl_vector_scale(beta, -1.0);
}
time_opt += (clock() - time_start) / (double(CLOCKS_PER_SEC) * 60.0);
// Store summary data.
for (size_t i = 0; i < d_size; i++) {
v_beta[i] = gsl_vector_get(beta, i);
}
c = 0;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
v_Vg[c] = gsl_matrix_get(V_g, i, j);
v_Ve[c] = gsl_matrix_get(V_e, i, j);
v_Vbeta[c] = gsl_matrix_get(Vbeta, i, j);
c++;
}
}
MPHSUMSTAT SNPs = {v_beta, p_wald, p_lrt, p_score, v_Vg, v_Ve, v_Vbeta};
sumStat.push_back(SNPs);
}
cout << endl;
infile.close();
infile.clear();
gsl_matrix_free(U_hat);
gsl_matrix_free(E_hat);
gsl_matrix_free(OmegaU);
gsl_matrix_free(OmegaE);
gsl_matrix_free(UltVehiY);
gsl_matrix_free(UltVehiBX);
gsl_matrix_free(UltVehiU);
gsl_matrix_free(UltVehiE);
gsl_matrix_free(Hi_all);
gsl_matrix_free(Hiy_all);
gsl_matrix_free(xHi_all);
gsl_matrix_free(Hessian);
gsl_vector_free(x);
gsl_vector_free(x_miss);
gsl_matrix_free(Y);
gsl_matrix_free(X);
gsl_matrix_free(V_g);
gsl_matrix_free(V_e);
gsl_matrix_free(B);
gsl_vector_free(beta);
gsl_matrix_free(Vbeta);
gsl_matrix_free(V_g_null);
gsl_matrix_free(V_e_null);
gsl_matrix_free(B_null);
gsl_matrix_free(se_B_null1);
gsl_matrix_free(se_B_null2);
return;
}
void MVLMM::AnalyzePlinkGXE(const gsl_matrix *U, const gsl_vector *eval,
const gsl_matrix *UtW, const gsl_matrix *UtY,
const gsl_vector *env) {
debug_msg("entering");
string file_bed = file_bfile + ".bed";
ifstream infile(file_bed.c_str(), ios::binary);
if (!infile) {
cout << "error reading bed file:" << file_bed << endl;
return;
}
clock_t time_start = clock();
time_UtX = 0;
time_opt = 0;
char ch[1];
bitset<8> b;
double logl_H0 = 0.0, logl_H1 = 0.0, p_wald = 0, p_lrt = 0, p_score = 0;
double crt_a, crt_b, crt_c;
int n_bit, n_miss, ci_total, ci_test;
double geno, x_mean;
size_t c = 0;
size_t n_size = UtY->size1, d_size = UtY->size2, c_size = UtW->size2 + 2;
size_t dc_size = d_size * (c_size + 1), v_size = d_size * (d_size + 1) / 2;
// Large matrices for EM.
gsl_matrix *U_hat = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *E_hat = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *OmegaU = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *OmegaE = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiY = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiBX = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiU = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *UltVehiE = gsl_matrix_alloc(d_size, n_size);
// Large matrices for NR.
// Each dxd block is H_k^{-1}.
gsl_matrix *Hi_all = gsl_matrix_alloc(d_size, d_size * n_size);
// Each column is H_k^{-1}y_k
gsl_matrix *Hiy_all = gsl_matrix_alloc(d_size, n_size);
// Each dcxdc block is x_k\otimes H_k^{-1}.
gsl_matrix *xHi_all = gsl_matrix_alloc(dc_size, d_size * n_size);
gsl_matrix *Hessian = gsl_matrix_alloc(v_size * 2, v_size * 2);
gsl_vector *x = gsl_vector_alloc(n_size);
gsl_matrix *Y = gsl_matrix_alloc(d_size, n_size);
gsl_matrix *X = gsl_matrix_alloc(c_size + 1, n_size);
gsl_matrix *V_g = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *V_e = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *B = gsl_matrix_alloc(d_size, c_size + 1);
gsl_vector *beta = gsl_vector_alloc(d_size);
gsl_matrix *Vbeta = gsl_matrix_alloc(d_size, d_size);
// Null estimates for initial values.
gsl_matrix *V_g_null = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *V_e_null = gsl_matrix_alloc(d_size, d_size);
gsl_matrix *B_null = gsl_matrix_alloc(d_size, c_size + 1);
gsl_matrix *se_B_null1 = gsl_matrix_alloc(d_size, c_size - 1);
gsl_matrix *se_B_null2 = gsl_matrix_alloc(d_size, c_size);
gsl_matrix_view X_sub1 = gsl_matrix_submatrix(X, 0, 0, c_size - 1, n_size);
gsl_matrix_view B_sub1 = gsl_matrix_submatrix(B, 0, 0, d_size, c_size - 1);
gsl_matrix_view xHi_all_sub1 = gsl_matrix_submatrix(
xHi_all, 0, 0, d_size * (c_size - 1), d_size * n_size);
gsl_matrix_view X_sub2 = gsl_matrix_submatrix(X, 0, 0, c_size, n_size);
gsl_matrix_view B_sub2 = gsl_matrix_submatrix(B, 0, 0, d_size, c_size);
gsl_matrix_view xHi_all_sub2 =
gsl_matrix_submatrix(xHi_all, 0, 0, d_size * c_size, d_size * n_size);
gsl_matrix_transpose_memcpy(Y, UtY);
gsl_matrix_view X_sub0 = gsl_matrix_submatrix(X, 0, 0, c_size - 2, n_size);
gsl_matrix_transpose_memcpy(&X_sub0.matrix, UtW);
gsl_vector_view X_row0 = gsl_matrix_row(X, c_size - 2);
gsl_blas_dgemv(CblasTrans, 1.0, U, env, 0.0, &X_row0.vector);
gsl_vector_view X_row1 = gsl_matrix_row(X, c_size - 1);
gsl_vector_set_zero(&X_row1.vector);
gsl_vector_view X_row2 = gsl_matrix_row(X, c_size);
gsl_vector_set_zero(&X_row2.vector);
gsl_vector_view B_col1 = gsl_matrix_column(B, c_size - 1);
gsl_vector_set_zero(&B_col1.vector);
gsl_vector_view B_col2 = gsl_matrix_column(B, c_size);
gsl_vector_set_zero(&B_col2.vector);
MphInitial(em_iter, em_prec, nr_iter, nr_prec, eval, &X_sub1.matrix, Y, l_min,
l_max, n_region, V_g, V_e, &B_sub1.matrix);
logl_H0 = MphEM('R', em_iter, em_prec, eval, &X_sub1.matrix, Y, U_hat, E_hat,
OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU, UltVehiE, V_g,
V_e, &B_sub1.matrix);
logl_H0 = MphNR('R', nr_iter, nr_prec, eval, &X_sub1.matrix, Y, Hi_all,
&xHi_all_sub1.matrix, Hiy_all, V_g, V_e, Hessian, crt_a,
crt_b, crt_c);
MphCalcBeta(eval, &X_sub1.matrix, Y, V_g, V_e, UltVehiY, &B_sub1.matrix,
se_B_null1);
c = 0;
Vg_remle_null.clear();
Ve_remle_null.clear();
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
Vg_remle_null.push_back(gsl_matrix_get(V_g, i, j));
Ve_remle_null.push_back(gsl_matrix_get(V_e, i, j));
VVg_remle_null.push_back(gsl_matrix_get(Hessian, c, c));
VVe_remle_null.push_back(gsl_matrix_get(Hessian, c + v_size, c + v_size));
c++;
}
}
beta_remle_null.clear();
se_beta_remle_null.clear();
for (size_t i = 0; i < se_B_null1->size1; i++) {
for (size_t j = 0; j < se_B_null1->size2; j++) {
beta_remle_null.push_back(gsl_matrix_get(B, i, j));
se_beta_remle_null.push_back(gsl_matrix_get(se_B_null1, i, j));
}
}
logl_remle_H0 = logl_H0;
cout.setf(std::ios_base::fixed, std::ios_base::floatfield);
cout.precision(4);
cout << "REMLE estimate for Vg in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_g, i, j) << "\t";
}
cout << endl;
}
cout << "se(Vg): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c, c)) << "\t";
}
cout << endl;
}
cout << "REMLE estimate for Ve in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_e, i, j) << "\t";
}
cout << endl;
}
cout << "se(Ve): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c + v_size, c + v_size)) << "\t";
}
cout << endl;
}
cout << "REMLE likelihood = " << logl_H0 << endl;
logl_H0 = MphEM('L', em_iter, em_prec, eval, &X_sub1.matrix, Y, U_hat, E_hat,
OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU, UltVehiE, V_g,
V_e, &B_sub1.matrix);
logl_H0 = MphNR('L', nr_iter, nr_prec, eval, &X_sub1.matrix, Y, Hi_all,
&xHi_all_sub1.matrix, Hiy_all, V_g, V_e, Hessian, crt_a,
crt_b, crt_c);
MphCalcBeta(eval, &X_sub1.matrix, Y, V_g, V_e, UltVehiY, &B_sub1.matrix,
se_B_null1);
c = 0;
Vg_mle_null.clear();
Ve_mle_null.clear();
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
Vg_mle_null.push_back(gsl_matrix_get(V_g, i, j));
Ve_mle_null.push_back(gsl_matrix_get(V_e, i, j));
VVg_mle_null.push_back(gsl_matrix_get(Hessian, c, c));
VVe_mle_null.push_back(gsl_matrix_get(Hessian, c + v_size, c + v_size));
c++;
}
}
beta_mle_null.clear();
se_beta_mle_null.clear();
for (size_t i = 0; i < se_B_null1->size1; i++) {
for (size_t j = 0; j < se_B_null1->size2; j++) {
beta_mle_null.push_back(gsl_matrix_get(B, i, j));
se_beta_mle_null.push_back(gsl_matrix_get(se_B_null1, i, j));
}
}
logl_mle_H0 = logl_H0;
cout << "MLE estimate for Vg in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_g, i, j) << "\t";
}
cout << endl;
}
cout << "se(Vg): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c, c)) << "\t";
}
cout << endl;
}
cout << "MLE estimate for Ve in the null model: " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
cout << gsl_matrix_get(V_e, i, j) << "\t";
}
cout << endl;
}
cout << "se(Ve): " << endl;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = 0; j <= i; j++) {
c = GetIndex(i, j, d_size);
cout << safe_sqrt(gsl_matrix_get(Hessian, c + v_size, c + v_size)) << "\t";
}
cout << endl;
}
cout << "MLE likelihood = " << logl_H0 << endl;
vector v_beta, v_Vg, v_Ve, v_Vbeta;
for (size_t i = 0; i < d_size; i++) {
v_beta.push_back(0.0);
}
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
v_Vg.push_back(0.0);
v_Ve.push_back(0.0);
v_Vbeta.push_back(0.0);
}
}
gsl_matrix_memcpy(V_g_null, V_g);
gsl_matrix_memcpy(V_e_null, V_e);
gsl_matrix_memcpy(B_null, B);
// Start reading genotypes and analyze.
// Calculate n_bit and c, the number of bit for each SNP.
if (ni_total % 4 == 0) {
n_bit = ni_total / 4;
} else {
n_bit = ni_total / 4 + 1;
}
// Print the first three magic numbers.
for (int i = 0; i < 3; ++i) {
infile.read(ch, 1);
b = ch[0];
}
for (vector::size_type t = 0; t < snpInfo.size(); ++t) {
if (t % d_pace == 0 || t == snpInfo.size() - 1) {
ProgressBar("Reading SNPs", t, snpInfo.size() - 1);
}
if (indicator_snp[t] == 0) {
continue;
}
// n_bit, and 3 is the number of magic numbers.
infile.seekg(t * n_bit + 3);
// Read genotypes.
x_mean = 0.0;
n_miss = 0;
ci_total = 0;
ci_test = 0;
for (int i = 0; i < n_bit; ++i) {
infile.read(ch, 1);
b = ch[0];
// Minor allele homozygous: 2.0; major: 0.0.
for (size_t j = 0; j < 4; ++j) {
if ((i == (n_bit - 1)) && ci_total == (int)ni_total) {
break;
}
if (indicator_idv[ci_total] == 0) {
ci_total++;
continue;
}
if (b[2 * j] == 0) {
if (b[2 * j + 1] == 0) {
gsl_vector_set(x, ci_test, 2);
x_mean += 2.0;
} else {
gsl_vector_set(x, ci_test, 1);
x_mean += 1.0;
}
} else {
if (b[2 * j + 1] == 1) {
gsl_vector_set(x, ci_test, 0);
} else {
gsl_vector_set(x, ci_test, -9);
n_miss++;
}
}
ci_total++;
ci_test++;
}
}
x_mean /= (double)(ni_test - n_miss);
for (size_t i = 0; i < ni_test; ++i) {
geno = gsl_vector_get(x, i);
if (geno == -9) {
gsl_vector_set(x, i, x_mean);
geno = x_mean;
}
if (x_mean > 1) {
gsl_vector_set(x, i, 2 - geno);
}
}
// Calculate statistics.
time_start = clock();
gsl_blas_dgemv(CblasTrans, 1.0, U, x, 0.0, &X_row1.vector);
gsl_vector_mul(x, env);
gsl_blas_dgemv(CblasTrans, 1.0, U, x, 0.0, &X_row2.vector);
time_UtX += (clock() - time_start) / (double(CLOCKS_PER_SEC) * 60.0);
// Initial values.
gsl_matrix_memcpy(V_g, V_g_null);
gsl_matrix_memcpy(V_e, V_e_null);
gsl_matrix_memcpy(B, B_null);
if (a_mode == 2 || a_mode == 3 || a_mode == 4) {
if (a_mode == 3 || a_mode == 4) {
logl_H0 = MphEM('R', em_iter / 10, em_prec * 10, eval, &X_sub2.matrix,
Y, U_hat, E_hat, OmegaU, OmegaE, UltVehiY, UltVehiBX,
UltVehiU, UltVehiE, V_g, V_e, &B_sub2.matrix);
logl_H0 = MphNR('R', nr_iter / 10, nr_prec * 10, eval, &X_sub2.matrix,
Y, Hi_all, &xHi_all_sub2.matrix, Hiy_all, V_g, V_e,
Hessian, crt_a, crt_b, crt_c);
MphCalcBeta(eval, &X_sub2.matrix, Y, V_g, V_e, UltVehiY, &B_sub2.matrix,
se_B_null2);
}
if (a_mode == 2 || a_mode == 4) {
logl_H0 = MphEM('L', em_iter / 10, em_prec * 10, eval, &X_sub2.matrix,
Y, U_hat, E_hat, OmegaU, OmegaE, UltVehiY, UltVehiBX,
UltVehiU, UltVehiE, V_g, V_e, &B_sub2.matrix);
logl_H0 = MphNR('L', nr_iter / 10, nr_prec * 10, eval, &X_sub2.matrix,
Y, Hi_all, &xHi_all_sub2.matrix, Hiy_all, V_g, V_e,
Hessian, crt_a, crt_b, crt_c);
MphCalcBeta(eval, &X_sub2.matrix, Y, V_g, V_e, UltVehiY, &B_sub2.matrix,
se_B_null2);
}
}
time_start = clock();
// 3 is before 1.
if (a_mode == 3 || a_mode == 4) {
p_score = MphCalcP(eval, &X_row2.vector, &X_sub2.matrix, Y, V_g_null,
V_e_null, UltVehiY, beta, Vbeta);
if (p_score < p_nr && crt == 1) {
logl_H1 = MphNR('R', 1, nr_prec * 10, eval, X, Y, Hi_all, xHi_all,
Hiy_all, V_g, V_e, Hessian, crt_a, crt_b, crt_c);
p_score = PCRT(3, d_size, p_score, crt_a, crt_b, crt_c);
}
}
if (a_mode == 2 || a_mode == 4) {
logl_H1 = MphEM('L', em_iter / 10, em_prec * 10, eval, X, Y, U_hat, E_hat,
OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU, UltVehiE,
V_g, V_e, B);
// Calculate beta and Vbeta.
p_lrt = MphCalcP(eval, &X_row2.vector, &X_sub2.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
p_lrt = gsl_cdf_chisq_Q(2.0 * (logl_H1 - logl_H0), (double)d_size);
if (p_lrt < p_nr) {
logl_H1 =
MphNR('L', nr_iter / 10, nr_prec * 10, eval, X, Y, Hi_all, xHi_all,
Hiy_all, V_g, V_e, Hessian, crt_a, crt_b, crt_c);
// Calculate beta and Vbeta.
p_lrt = MphCalcP(eval, &X_row2.vector, &X_sub2.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
p_lrt = gsl_cdf_chisq_Q(2.0 * (logl_H1 - logl_H0), (double)d_size);
if (crt == 1) {
p_lrt = PCRT(2, d_size, p_lrt, crt_a, crt_b, crt_c);
}
}
}
if (a_mode == 1 || a_mode == 4) {
logl_H1 = MphEM('R', em_iter / 10, em_prec * 10, eval, X, Y, U_hat, E_hat,
OmegaU, OmegaE, UltVehiY, UltVehiBX, UltVehiU, UltVehiE,
V_g, V_e, B);
p_wald = MphCalcP(eval, &X_row2.vector, &X_sub2.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
if (p_wald < p_nr) {
logl_H1 =
MphNR('R', nr_iter / 10, nr_prec * 10, eval, X, Y, Hi_all, xHi_all,
Hiy_all, V_g, V_e, Hessian, crt_a, crt_b, crt_c);
p_wald = MphCalcP(eval, &X_row2.vector, &X_sub2.matrix, Y, V_g, V_e,
UltVehiY, beta, Vbeta);
if (crt == 1) {
p_wald = PCRT(1, d_size, p_wald, crt_a, crt_b, crt_c);
}
}
}
if (x_mean > 1) {
gsl_vector_scale(beta, -1.0);
}
time_opt += (clock() - time_start) / (double(CLOCKS_PER_SEC) * 60.0);
// Store summary data.
for (size_t i = 0; i < d_size; i++) {
v_beta[i] = gsl_vector_get(beta, i);
}
c = 0;
for (size_t i = 0; i < d_size; i++) {
for (size_t j = i; j < d_size; j++) {
v_Vg[c] = gsl_matrix_get(V_g, i, j);
v_Ve[c] = gsl_matrix_get(V_e, i, j);
v_Vbeta[c] = gsl_matrix_get(Vbeta, i, j);
c++;
}
}
MPHSUMSTAT SNPs = {v_beta, p_wald, p_lrt, p_score, v_Vg, v_Ve, v_Vbeta};
sumStat.push_back(SNPs);
}
cout << endl;
infile.close();
infile.clear();
gsl_matrix_free(U_hat);
gsl_matrix_free(E_hat);
gsl_matrix_free(OmegaU);
gsl_matrix_free(OmegaE);
gsl_matrix_free(UltVehiY);
gsl_matrix_free(UltVehiBX);
gsl_matrix_free(UltVehiU);
gsl_matrix_free(UltVehiE);
gsl_matrix_free(Hi_all);
gsl_matrix_free(Hiy_all);
gsl_matrix_free(xHi_all);
gsl_matrix_free(Hessian);
gsl_vector_free(x);
gsl_matrix_free(Y);
gsl_matrix_free(X);
gsl_matrix_free(V_g);
gsl_matrix_free(V_e);
gsl_matrix_free(B);
gsl_vector_free(beta);
gsl_matrix_free(Vbeta);
gsl_matrix_free(V_g_null);
gsl_matrix_free(V_e_null);
gsl_matrix_free(B_null);
gsl_matrix_free(se_B_null1);
gsl_matrix_free(se_B_null2);
return;
}