69 #include "mltplyCommon.h" 70 #include "mltplySpinCore.h" 71 #include "mltplyMPISpinCore.h" 73 #include "wrapperMPI.h" 80 unsigned long int i_int ,
82 double complex *tmp_v0 ,
83 double complex *tmp_v1 )
86 double complex dam_pr;
88 X->Def.InterAll_OffDiagonal[i_int][0],
X->Def.InterAll_OffDiagonal[i_int][1],
89 X->Def.InterAll_OffDiagonal[i_int][3],
X->Def.InterAll_OffDiagonal[i_int][4],
90 X->Def.InterAll_OffDiagonal[i_int][5],
X->Def.InterAll_OffDiagonal[i_int][7],
91 X->Def.ParaInterAll_OffDiagonal[i_int],
X, tmp_v0, tmp_v1);
92 X->Large.prdct += dam_pr;
110 double complex tmp_J,
112 double complex *tmp_v0,
113 double complex *tmp_v1
116 int mask1, mask2, state1, state2, ierr, origin;
117 unsigned long int idim_max_buf, j;
118 MPI_Status statusMPI;
119 double complex Jint, dmv, dam_pr;
121 mask1 = (int)
X->Def.Tpow[org_isite1];
122 mask2 = (
int)
X->Def.Tpow[org_isite3];
123 if (org_isite1 != org_isite3) {
124 origin =
myrank ^ (mask1 + mask2);
127 if (org_ispin1 == org_ispin4 && org_ispin2 == org_ispin3) {
136 state1 = (origin & mask1) / mask1;
137 state2 = (origin & mask2) / mask2;
139 if (state1 == org_ispin2 && state2 == org_ispin4) {
142 else if (state1 == org_ispin1 && state2 == org_ispin3) {
144 if (
X->Large.mode == M_CORR ||
X->Large.mode == M_CALCSPEC) {
152 ierr = MPI_Sendrecv(&
X->Check.idim_max, 1, MPI_UNSIGNED_LONG, origin, 0,
153 &idim_max_buf, 1, MPI_UNSIGNED_LONG, origin, 0,
154 MPI_COMM_WORLD, &statusMPI);
156 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
157 v1buf, idim_max_buf + 1, MPI_DOUBLE_COMPLEX, origin, 0,
158 MPI_COMM_WORLD, &statusMPI);
162 #pragma omp parallel default(none) reduction(+:dam_pr) private(j, dmv) \ 163 firstprivate(idim_max_buf, Jint, X) shared(v1buf, tmp_v1, tmp_v0) 165 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
167 for (j = 1; j <= idim_max_buf; j++) {
168 dmv = Jint *
v1buf[j];
170 dam_pr += conj(tmp_v1[j]) * dmv;
175 for (j = 1; j <= idim_max_buf; j++) {
176 dmv = Jint *
v1buf[j];
177 dam_pr += conj(tmp_v1[j]) * dmv;
192 unsigned long int i_int ,
194 double complex *tmp_v0 ,
195 double complex *tmp_v1
198 double complex dam_pr;
200 X->Def.InterAll_OffDiagonal[i_int][0],
X->Def.InterAll_OffDiagonal[i_int][1],
201 X->Def.InterAll_OffDiagonal[i_int][4],
X->Def.InterAll_OffDiagonal[i_int][5],
202 X->Def.InterAll_OffDiagonal[i_int][7],
X->Def.ParaInterAll_OffDiagonal[i_int],
X, tmp_v0, tmp_v1);
203 X->Large.prdct += dam_pr;
218 double complex tmp_J,
220 double complex *tmp_v0,
221 double complex *tmp_v1
224 int mask1, mask2, state2, ierr;
225 long int origin, num1;
226 unsigned long int idim_max_buf, j;
227 MPI_Status statusMPI;
228 double complex Jint, dmv, dam_pr;
230 if (org_isite1 == org_isite3 && org_ispin1 == org_ispin4) {
234 mask1 = (int)
X->Def.Tpow[org_isite1];
235 mask2 = (
int)
X->Def.Tpow[org_isite3];
237 state2 = (origin & mask2) / mask2;
239 if (num1 != 0 && state2 == org_ispin4) {
244 if (
X->Large.mode == M_CORR ||
X->Large.mode == M_CALCSPEC) Jint = 0;
250 ierr = MPI_Sendrecv(&
X->Check.idim_max, 1, MPI_UNSIGNED_LONG, origin, 0,
251 &idim_max_buf, 1, MPI_UNSIGNED_LONG, origin, 0,
252 MPI_COMM_WORLD, &statusMPI);
254 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
255 v1buf, idim_max_buf + 1, MPI_DOUBLE_COMPLEX, origin, 0,
256 MPI_COMM_WORLD, &statusMPI);
260 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
261 #pragma omp parallel for default(none) reduction(+:dam_pr) private(j, dmv) \ 262 firstprivate(idim_max_buf, Jint, X) shared(v1buf, tmp_v1, tmp_v0) 263 for (j = 1; j <= idim_max_buf; j++) {
264 dmv = Jint *
v1buf[j];
266 dam_pr += conj(tmp_v1[j]) * dmv;
270 #pragma omp parallel for default(none) reduction(+:dam_pr) private(j, dmv) \ 271 firstprivate(idim_max_buf, Jint, X) shared(v1buf, tmp_v1, tmp_v0) 272 for (j = 1; j <= idim_max_buf; j++) {
273 dmv = Jint *
v1buf[j];
274 dam_pr += conj(tmp_v1[j]) * dmv;
288 unsigned long int i_int,
290 double complex *tmp_v0,
291 double complex *tmp_v1
295 double complex dam_pr;
297 X->Def.InterAll_OffDiagonal[i_int][0],
X->Def.InterAll_OffDiagonal[i_int][1],
298 X->Def.InterAll_OffDiagonal[i_int][3],
X->Def.InterAll_OffDiagonal[i_int][4],
299 X->Def.InterAll_OffDiagonal[i_int][5],
X->Def.ParaInterAll_OffDiagonal[i_int],
X, tmp_v0, tmp_v1);
300 X->Large.prdct += dam_pr;
315 double complex tmp_J,
317 double complex *tmp_v0,
318 double complex *tmp_v1
321 int mask1, mask2, state1, ierr, num1;
323 unsigned long int idim_max_buf, j;
324 MPI_Status statusMPI;
325 double complex Jint, dmv, dam_pr;
327 if (org_isite1 == org_isite3 && org_ispin1 == org_ispin3) {
331 mask1 = (int)
X->Def.Tpow[org_isite1];
333 state1 = (origin & mask1) / mask1;
334 mask2 = (int)
X->Def.Tpow[org_isite3];
336 if (state1 == org_ispin2) {
348 if (
X->Large.mode == M_CORR ||
X->Large.mode == M_CALCSPEC) {
357 ierr = MPI_Sendrecv(&
X->Check.idim_max, 1, MPI_UNSIGNED_LONG, origin, 0,
358 &idim_max_buf, 1, MPI_UNSIGNED_LONG, origin, 0,
359 MPI_COMM_WORLD, &statusMPI);
361 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
362 v1buf, idim_max_buf + 1, MPI_DOUBLE_COMPLEX, origin, 0,
363 MPI_COMM_WORLD, &statusMPI);
367 #pragma omp parallel default(none) reduction(+:dam_pr) private(j, dmv) \ 368 firstprivate(idim_max_buf, Jint, X) shared(v1buf, tmp_v1, tmp_v0) 370 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
372 for (j = 1; j <= idim_max_buf; j++) {
373 dmv = Jint *
v1buf[j];
375 dam_pr += conj(tmp_v1[j]) * dmv;
380 for (j = 1; j <= idim_max_buf; j++) {
381 dmv = Jint *
v1buf[j];
382 dam_pr += conj(tmp_v1[j]) * dmv;
402 double complex tmp_J,
404 double complex *tmp_v0,
405 double complex *tmp_v1
408 long unsigned int mask1, mask2, num1,num2;
411 double complex dmv, dam_pr;
412 mask1 = (int)
X->Def.Tpow[org_isite1];
413 mask2 = (
int)
X->Def.Tpow[org_isite3];
418 #pragma omp parallel default(none) reduction(+:dam_pr) private(j, dmv) \ 419 firstprivate(tmp_J, X, num1, num2) shared(tmp_v1, tmp_v0) 421 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
423 for (j = 1; j <=
X->Check.idim_max; j++) {
424 dmv = num1*num2*tmp_v1[j] * tmp_J;
426 dam_pr += conj(tmp_v1[j]) * dmv;
431 for (j = 1; j <=
X->Check.idim_max; j++) {
432 dmv = num1 * num2 * tmp_v1[j] * tmp_J;
433 dam_pr += conj(tmp_v1[j]) * dmv;
453 double complex tmp_J,
455 double complex *tmp_v0,
456 double complex *tmp_v1
459 long unsigned int mask1, mask2, num1, num2;
462 double complex Jint, dmv, dam_pr;
464 mask1 = (int)
X->Def.Tpow[org_isite1];
465 mask2 = (
int)
X->Def.Tpow[org_isite3];
469 #pragma omp parallel default(none) reduction(+:dam_pr) private(j, dmv, num1) \ 470 firstprivate(Jint, X, num2, mask1, org_ispin1) shared(tmp_v1, tmp_v0) 472 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
474 for (j = 1; j <=
X->Check.idim_max; j++) {
476 dmv = Jint * num1 * num2 * tmp_v1[j];
478 dam_pr += conj(tmp_v1[j]) * dmv;
483 for (j = 1; j <=
X->Check.idim_max; j++) {
485 dmv = Jint * num1 * num2 * tmp_v1[j];
486 dam_pr += conj(tmp_v1[j]) * dmv;
501 unsigned long int i_int,
503 double complex *tmp_v0,
504 double complex *tmp_v1
507 double complex dam_pr;
509 X->Def.InterAll_OffDiagonal[i_int][0],
X->Def.InterAll_OffDiagonal[i_int][1],
510 X->Def.InterAll_OffDiagonal[i_int][3],
X->Def.InterAll_OffDiagonal[i_int][4],
511 X->Def.InterAll_OffDiagonal[i_int][5],
X->Def.InterAll_OffDiagonal[i_int][7],
512 X->Def.ParaInterAll_OffDiagonal[i_int],
X, tmp_v0, tmp_v1);
513 X->Large.prdct += dam_pr;
529 double complex tmp_J,
531 double complex *tmp_v0,
532 double complex *tmp_v1
535 int mask2, state2, ierr, origin;
536 unsigned long int mask1, idim_max_buf, j, ioff, state1, state1check;
537 MPI_Status statusMPI;
538 double complex Jint, dmv, dam_pr;
542 mask2 = (int)
X->Def.Tpow[org_isite3];
544 state2 = (origin & mask2) / mask2;
546 if (state2 == org_ispin4) {
547 state1check = (
unsigned long int) org_ispin2;
550 else if (state2 == org_ispin3) {
551 state1check = (
unsigned long int) org_ispin1;
553 if (
X->Large.mode == M_CORR ||
X->Large.mode == M_CALCSPEC) {
559 ierr = MPI_Sendrecv(&
X->Check.idim_max, 1, MPI_UNSIGNED_LONG, origin, 0,
560 &idim_max_buf, 1, MPI_UNSIGNED_LONG, origin, 0,
561 MPI_COMM_WORLD, &statusMPI);
563 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
564 v1buf, idim_max_buf + 1, MPI_DOUBLE_COMPLEX, origin, 0,
565 MPI_COMM_WORLD, &statusMPI);
570 mask1 =
X->Def.Tpow[org_isite1];
573 #pragma omp parallel default(none) reduction(+:dam_pr) private(j, dmv, state1, ioff) \ 574 firstprivate(idim_max_buf, Jint, X, state1check, mask1) shared(v1buf, tmp_v1, tmp_v0) 576 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
578 for (j = 0; j < idim_max_buf; j++) {
581 dmv = Jint *
v1buf[j + 1];
582 tmp_v0[ioff + 1] += dmv;
583 dam_pr += conj(tmp_v1[ioff + 1]) * dmv;
589 for (j = 0; j < idim_max_buf; j++) {
592 dmv = Jint *
v1buf[j + 1];
593 dam_pr += conj(tmp_v1[ioff + 1]) * dmv;
609 unsigned long int i_int,
611 double complex *tmp_v0,
612 double complex *tmp_v1
615 double complex dam_pr;
617 X->Def.InterAll_OffDiagonal[i_int][0],
X->Def.InterAll_OffDiagonal[i_int][1],
618 X->Def.InterAll_OffDiagonal[i_int][4],
X->Def.InterAll_OffDiagonal[i_int][5],
619 X->Def.InterAll_OffDiagonal[i_int][7],
X->Def.ParaInterAll_OffDiagonal[i_int],
X, tmp_v0, tmp_v1);
620 X->Large.prdct += dam_pr;
635 double complex tmp_J,
637 double complex *tmp_v0,
638 double complex *tmp_v1
641 int mask2, state2, ierr, origin;
642 unsigned long int mask1, idim_max_buf, j, state1, state1check;
643 MPI_Status statusMPI;
644 double complex Jint, dmv, dam_pr;
648 mask2 = (int)
X->Def.Tpow[org_isite3];
650 state2 = (origin & mask2) / mask2;
651 if (state2 == org_ispin4) {
652 state1check = (
unsigned long int) org_ispin1;
655 else if (state2 == org_ispin3) {
656 state1check = (
unsigned long int) org_ispin1;
658 if (
X->Large.mode == M_CORR ||
X->Large.mode == M_CALCSPEC) {
664 ierr = MPI_Sendrecv(&
X->Check.idim_max, 1, MPI_UNSIGNED_LONG, origin, 0,
665 &idim_max_buf, 1, MPI_UNSIGNED_LONG, origin, 0,
666 MPI_COMM_WORLD, &statusMPI);
668 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
669 v1buf, idim_max_buf + 1, MPI_DOUBLE_COMPLEX, origin, 0,
670 MPI_COMM_WORLD, &statusMPI);
675 mask1 =
X->Def.Tpow[org_isite1];
678 #pragma omp parallel default(none) reduction(+:dam_pr) private(j, dmv, state1) \ 679 firstprivate(idim_max_buf, Jint, X, state1check, mask1) shared(v1buf, tmp_v1, tmp_v0) 681 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
682 for (j = 0; j < idim_max_buf; j++) {
683 state1 = (j & mask1) / mask1;
684 if (state1 == state1check) {
685 dmv = Jint *
v1buf[j + 1];
686 tmp_v0[j + 1] += dmv;
687 dam_pr += conj(tmp_v1[j + 1]) * dmv;
692 for (j = 0; j < idim_max_buf; j++) {
693 state1 = (j & mask1) / mask1;
694 if (state1 == state1check) {
695 dmv = Jint *
v1buf[j + 1];
696 dam_pr += conj(tmp_v1[j + 1]) * dmv;
712 unsigned long int i_int,
714 double complex *tmp_v0,
715 double complex *tmp_v1
718 double complex dam_pr;
720 X->Def.InterAll_OffDiagonal[i_int][0],
X->Def.InterAll_OffDiagonal[i_int][1],
721 X->Def.InterAll_OffDiagonal[i_int][3],
X->Def.InterAll_OffDiagonal[i_int][4],
722 X->Def.InterAll_OffDiagonal[i_int][5],
X->Def.ParaInterAll_OffDiagonal[i_int],
X, tmp_v0, tmp_v1);
723 X->Large.prdct += dam_pr;
738 double complex tmp_J,
740 double complex *tmp_v0,
741 double complex *tmp_v1
745 unsigned long int mask1, j, ioff, state1, state1check;
747 double complex Jint, dmv, dam_pr;
751 mask2 = (int)
X->Def.Tpow[org_isite3];
752 state2 = (
myrank & mask2) / mask2;
754 if (state2 == org_ispin3) {
755 state1check = org_ispin2;
762 mask1 = (int)
X->Def.Tpow[org_isite1];
765 #pragma omp parallel
default(none) reduction(+:dam_pr)
private(j, dmv, state1, ioff) \
766 firstprivate(Jint,
X, state1check, mask1) shared(tmp_v1, tmp_v0)
768 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
770 for (j = 0; j <
X->Check.idim_max; j++) {
772 state1 = (j & mask1) / mask1;
774 if (state1 == state1check) {
775 dmv = Jint * tmp_v1[j + 1];
778 dmv = conj(Jint) * tmp_v1[j + 1];
780 tmp_v0[ioff + 1] += dmv;
781 dam_pr += conj(tmp_v1[ioff + 1]) * dmv;
784 else if (
X->Large.mode == M_CORR) {
786 for (j = 0; j <
X->Check.idim_max; j++) {
788 state1 = (j & mask1) / mask1;
790 if (state1 == state1check) {
791 dmv = Jint * tmp_v1[j + 1];
796 dam_pr += conj(tmp_v1[ioff + 1]) * dmv;
801 for (j = 0; j <
X->Check.idim_max; j++) {
802 state1 = (j & mask1) / mask1;
804 if (state1 == state1check) {
805 dmv = Jint * tmp_v1[j + 1];
808 dmv = conj(Jint) * tmp_v1[j + 1];
810 dam_pr += conj(tmp_v1[ioff + 1]) * dmv;
830 double complex tmp_J,
832 double complex *tmp_v0,
833 double complex *tmp_v1
836 unsigned long int off, j;
838 double complex tmp_V, dmv, dam_pr;
839 MPI_Status statusMPI;
841 if (org_isite1 == org_isite3 && org_ispin1 == org_ispin4) {
846 &off,
X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE) {
858 if (ihermite ==
FALSE) {
862 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE) {
864 if (
X->Large.mode == M_CORR ||
X->Large.mode == M_CALCSPEC) tmp_V = 0.0;
871 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
872 v1buf,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
873 MPI_COMM_WORLD, &statusMPI);
877 #pragma omp parallel default(none) reduction(+:dam_pr) firstprivate(X, tmp_V) \ 878 private(j, dmv) shared (tmp_v0, tmp_v1, v1buf) 880 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
882 for (j = 1; j <=
X->Check.idim_max; j++) {
883 dmv =
v1buf[j] * tmp_V;
885 dam_pr += conj(tmp_v1[j]) * dmv;
890 for (j = 1; j <=
X->Check.idim_max; j++) {
891 dmv =
v1buf[j] * tmp_V;
892 dam_pr += conj(tmp_v1[j]) * dmv;
912 double complex tmp_J,
914 double complex *tmp_v0,
915 double complex *tmp_v1
918 unsigned long int j, off;
920 double complex tmp_V, dmv, dam_pr;
921 MPI_Status statusMPI;
923 if (org_isite1 == org_isite3 && org_ispin1 == org_ispin3) {
929 &off,
X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE) {
933 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE) {
936 if (
X->Large.mode == M_CORR ||
X->Large.mode == M_CALCSPEC) tmp_V = 0.0;
944 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
945 v1buf,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
946 MPI_COMM_WORLD, &statusMPI);
950 #pragma omp parallel default(none) reduction(+:dam_pr) firstprivate(X, tmp_V) private(j, dmv) \ 951 shared (tmp_v0, tmp_v1, v1buf) 953 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
955 for (j = 1; j <=
X->Check.idim_max; j++) {
956 dmv =
v1buf[j] * tmp_V;
958 dam_pr += conj(tmp_v1[j]) * dmv;
963 for (j = 1; j <=
X->Check.idim_max; j++) {
964 dmv =
v1buf[j] * tmp_V;
965 dam_pr += conj(tmp_v1[j]) * dmv;
986 double complex tmp_J,
988 double complex *tmp_v0,
989 double complex *tmp_v1
992 unsigned long int tmp_off, off, j;
993 int origin, ierr, ihermite;
994 double complex tmp_V, dmv, dam_pr;
995 MPI_Status statusMPI;
999 if (org_isite1 == org_isite3 && org_ispin1 == org_ispin4 &&
1000 org_ispin2 == org_ispin3) {
1006 &tmp_off,
X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE) {
1009 &off,
X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE) {
1013 else ihermite =
FALSE;
1019 if (ihermite ==
FALSE) {
1021 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE) {
1024 X->Def.Tpow) ==
TRUE) {
1025 tmp_V = conj(tmp_J);
1026 if (
X->Large.mode == M_CORR ||
X->Large.mode == M_CALCSPEC) tmp_V = 0.0;
1035 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1036 v1buf,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1037 MPI_COMM_WORLD, &statusMPI);
1041 #pragma omp parallel default(none) reduction(+:dam_pr) firstprivate(X, tmp_V) private(j, dmv) \ 1042 shared (tmp_v0, tmp_v1, v1buf) 1044 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
1046 for (j = 1; j <=
X->Check.idim_max; j++) {
1047 dmv =
v1buf[j] * tmp_V;
1049 dam_pr += conj(tmp_v1[j]) * dmv;
1054 for (j = 1; j <=
X->Check.idim_max; j++) {
1055 dmv =
v1buf[j] * tmp_V;
1056 dam_pr += conj(tmp_v1[j]) * dmv;
1075 double complex tmp_J,
1077 double complex *tmp_v0,
1078 double complex *tmp_v1
1081 unsigned long int j, num1;
1082 double complex tmp_V, dmv, dam_pr;
1085 num1 =
BitCheckGeneral((
unsigned long int)
myrank, org_isite1 + 1, org_ispin1,
X->Def.SiteToBit,
X->Def.Tpow);
1088 num1 =
BitCheckGeneral((
unsigned long int)
myrank, org_isite3 + 1, org_ispin3,
X->Def.SiteToBit,
X->Def.Tpow);
1097 #pragma omp parallel default(none) reduction(+:dam_pr) firstprivate(X, tmp_V) private(j, dmv) \ 1098 shared (tmp_v0, tmp_v1) 1100 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
1102 for (j = 1; j <=
X->Check.idim_max; j++) {
1103 dmv = tmp_v1[j] * tmp_V;
1105 dam_pr += conj(tmp_v1[j]) * dmv;
1110 for (j = 1; j <=
X->Check.idim_max; j++) {
1111 dmv = tmp_v1[j] * tmp_V;
1112 dam_pr += conj(tmp_v1[j]) * dmv;
1130 double complex tmp_trans,
1132 double complex *tmp_v0,
1133 double complex *tmp_v1
1136 unsigned long int off, j;
1138 double complex tmp_V, dmv, dam_pr;
1139 MPI_Status statusMPI;
1142 &off,
X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE) {
1146 org_isite1 + 1, org_ispin2, org_ispin1, &off,
1147 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE) {
1148 tmp_V = conj(tmp_trans);
1149 if (
X->Large.mode == M_CORR ||
X->Large.mode == M_CALCSPEC) tmp_V = 0.0;
1155 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1156 v1buf,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1157 MPI_COMM_WORLD, &statusMPI);
1161 #pragma omp parallel default(none) reduction(+:dam_pr) firstprivate(X, tmp_V) private(j, dmv) \ 1162 shared (tmp_v0, tmp_v1, v1buf) 1164 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
1166 for (j = 1; j <=
X->Check.idim_max; j++) {
1167 dmv =
v1buf[j] * tmp_V;
1169 dam_pr += conj(tmp_v1[j]) * dmv;
1174 for (j = 1; j <=
X->Check.idim_max; j++) {
1175 dmv =
v1buf[j] * tmp_V;
1176 dam_pr += conj(tmp_v1[j]) * dmv;
1193 double complex tmp_trans,
1195 double complex *tmp_v0,
1196 double complex *tmp_v1
1199 unsigned long int j, num1;
1200 double complex tmp_V, dmv, dam_pr;
1204 org_isite1 + 1, org_ispin1,
X->Def.SiteToBit,
X->Def.Tpow);
1211 #pragma omp parallel default(none) reduction(+:dam_pr) firstprivate(X, tmp_V) private(j, dmv) \ 1212 shared (tmp_v0, tmp_v1) 1214 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
1216 for (j = 1; j <=
X->Check.idim_max; j++) {
1217 dmv = tmp_v1[j] * tmp_V;
1219 dam_pr += conj(tmp_v1[j]) * dmv;
1224 for (j = 1; j <=
X->Check.idim_max; j++) {
1225 dmv = tmp_v1[j] * tmp_V;
1226 dam_pr += conj(tmp_v1[j]) * dmv;
1243 double complex tmp_trans,
1245 double complex *tmp_v0,
1246 double complex *tmp_v1
1249 unsigned long int j, num1;
1250 double complex tmp_V, dmv, dam_pr;
1254 org_isite1 + 1, org_ispin1,
X->Def.SiteToBit,
X->Def.Tpow);
1261 #pragma omp parallel default(none) reduction(+:dam_pr) firstprivate(X, tmp_V) private(j, dmv) \ 1262 shared (tmp_v0, tmp_v1) 1264 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
1266 for (j = 1; j <=
X->Check.idim_max; j++) {
1267 dmv = tmp_v1[j] * tmp_V;
1269 dam_pr += conj(tmp_v1[j]) * dmv;
1274 for (j = 1; j <=
X->Check.idim_max; j++) {
1275 dmv = tmp_v1[j] * tmp_V;
1276 dam_pr += conj(tmp_v1[j]) * dmv;
1294 double complex tmp_trans,
1296 double complex *tmp_v0,
1297 double complex *tmp_v1,
1298 double complex *tmp_v1buf,
1299 unsigned long int idim_max,
1302 long unsigned int _ihfbit
1306 unsigned long int off, j, tmp_off,idim_max_buf;
1308 double complex tmp_V, dmv;
1309 MPI_Status statusMPI;
1312 &off,
X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE) {
1316 org_isite1 + 1, org_ispin2, org_ispin1, &off,
1317 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE) {
1318 tmp_V = conj(tmp_trans);
1319 if (
X->Large.mode == M_CORR ||
X->Large.mode ==M_CALCSPEC) tmp_V = 0.0;
1325 ierr = MPI_Sendrecv(&idim_max, 1, MPI_UNSIGNED_LONG, origin, 0,
1326 &idim_max_buf, 1, MPI_UNSIGNED_LONG, origin, 0,
1327 MPI_COMM_WORLD, &statusMPI);
1330 ierr = MPI_Sendrecv(
list_1_org, idim_max + 1, MPI_UNSIGNED_LONG, origin, 0,
1331 list_1buf_org, idim_max_buf + 1, MPI_UNSIGNED_LONG, origin, 0,
1332 MPI_COMM_WORLD, &statusMPI);
1335 ierr = MPI_Sendrecv(tmp_v1, idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1336 v1buf, idim_max_buf + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1337 MPI_COMM_WORLD, &statusMPI);
1340 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode ==M_CALCSPEC) {
1341 #pragma omp parallel for default(none)\ 1342 firstprivate(X, tmp_V, idim_max_buf, list_1buf_org) private(j, dmv, tmp_off) \ 1343 shared (tmp_v0, tmp_v1, v1buf) 1344 for (j = 1; j <= idim_max_buf; j++) {
1346 dmv =
v1buf[j] * tmp_V;
1347 tmp_v0[tmp_off] += dmv;
1370 double complex tmp_J,
1372 double complex *tmp_v0,
1373 double complex *tmp_v1
1376 unsigned long int off, j, num1;
1377 int origin, ierr, isite, IniSpin;
1378 double complex tmp_V, dmv, dam_pr;
1379 MPI_Status statusMPI;
1382 org_isite3 + 1, org_ispin3, org_ispin4, &off,
1383 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE)
1386 isite = org_isite1 + 1;
1387 IniSpin = org_ispin1;
1390 org_isite3 + 1, org_ispin4, org_ispin3, &off,
1391 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE)
1393 tmp_V = conj(tmp_J);
1394 if (
X->Large.mode == M_CORR ||
X->Large.mode == M_CALCSPEC) tmp_V = 0.0;
1395 isite = org_isite1 + 1;
1396 IniSpin = org_ispin1;
1402 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1403 v1buf,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1404 MPI_COMM_WORLD, &statusMPI);
1408 #pragma omp parallel default(none) reduction(+:dam_pr) firstprivate(X, tmp_V, isite, IniSpin) \ 1409 private(j, dmv, num1) shared (tmp_v0, tmp_v1, v1buf) 1411 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
1413 for (j = 1; j <=
X->Check.idim_max; j++) {
1416 dmv =
v1buf[j] * tmp_V;
1418 dam_pr += conj(tmp_v1[j]) * dmv;
1424 for (j = 1; j <=
X->Check.idim_max; j++) {
1427 dmv =
v1buf[j] * tmp_V;
1428 dam_pr += conj(tmp_v1[j]) * dmv;
1449 double complex tmp_J,
1451 double complex *tmp_v0,
1452 double complex *tmp_v1
1455 unsigned long int num1, j, off;
1456 int isite, IniSpin, FinSpin;
1457 double complex tmp_V, dmv, dam_pr;
1461 org_isite3+1, org_ispin3,
X->Def.SiteToBit,
X->Def.Tpow);
1464 isite = org_isite1 + 1;
1465 IniSpin = org_ispin2;
1466 FinSpin = org_ispin1;
1471 #pragma omp parallel default(none) reduction(+:dam_pr) \ 1472 firstprivate(X, tmp_V, isite, IniSpin, FinSpin) private(j, dmv, num1, off) \ 1473 shared (tmp_v0, tmp_v1, v1buf) 1475 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
1477 for (j = 1; j <=
X->Check.idim_max; j++) {
1479 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE)
1481 dmv = tmp_v1[j] * tmp_V;
1482 tmp_v0[off + 1] += dmv;
1483 dam_pr += conj(tmp_v1[off + 1]) * dmv;
1489 for (j = 1; j <=
X->Check.idim_max; j++) {
1491 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE)
1493 dmv = tmp_v1[j] * tmp_V;
1494 dam_pr += conj(tmp_v1[off + 1]) * dmv;
1516 double complex tmp_J,
1518 double complex *tmp_v0,
1519 double complex *tmp_v1
1522 unsigned long int off, j;
1523 int origin, ierr, isite, IniSpin, FinSpin;
1524 double complex tmp_V, dmv, dam_pr;
1525 MPI_Status statusMPI;
1528 org_isite3 + 1, org_ispin3, org_ispin4, &off,
1529 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE)
1532 isite = org_isite1 + 1;
1533 IniSpin = org_ispin2;
1534 FinSpin = org_ispin1;
1537 org_isite3 + 1, org_ispin4, org_ispin3, &off,
1538 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE)
1540 tmp_V = conj(tmp_J);
1541 if (
X->Large.mode == M_CORR ||
X->Large.mode == M_CALCSPEC) tmp_V = 0.0;
1542 isite = org_isite1 + 1;
1543 IniSpin = org_ispin1;
1544 FinSpin = org_ispin2;
1550 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1551 v1buf,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1552 MPI_COMM_WORLD, &statusMPI);
1556 #pragma omp parallel default(none) reduction(+:dam_pr) \ 1557 firstprivate(X, tmp_V, isite, IniSpin, FinSpin) private(j, dmv, off) shared (tmp_v0, tmp_v1, v1buf) 1559 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
1561 for (j = 1; j <=
X->Check.idim_max; j++) {
1563 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE)
1565 dmv =
v1buf[j] * tmp_V;
1566 tmp_v0[off + 1] += dmv;
1567 dam_pr += conj(tmp_v1[off + 1]) * dmv;
1573 for (j = 1; j <=
X->Check.idim_max; j++) {
1575 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE)
1577 dmv =
v1buf[j] * tmp_V;
1578 dam_pr += conj(tmp_v1[off + 1]) * dmv;
1598 double complex tmp_J,
1600 double complex *tmp_v0,
1601 double complex *tmp_v1
1604 unsigned long int j, num1;
1605 double complex tmp_V, dmv, dam_pr;
1609 if (num1 !=
FALSE) {
1615 #pragma omp parallel default(none) reduction(+:dam_pr) \ 1616 firstprivate(X, tmp_V, org_isite1, org_ispin1) private(j, dmv, num1) shared (tmp_v0, tmp_v1) 1618 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
1620 for (j = 1; j <=
X->Check.idim_max; j++) {
1621 num1 =
BitCheckGeneral(j - 1, org_isite1 + 1, org_ispin1,
X->Def.SiteToBit,
X->Def.Tpow);
1623 dmv = tmp_v1[j] * tmp_V * num1;
1625 dam_pr += conj(tmp_v1[j]) * dmv;
1630 for (j = 1; j <=
X->Check.idim_max; j++) {
1631 num1 =
BitCheckGeneral(j - 1, org_isite1 + 1, org_ispin1,
X->Def.SiteToBit,
X->Def.Tpow);
1632 dmv = tmp_v1[j] * tmp_V * num1;
1633 dam_pr += conj(tmp_v1[j]) * dmv;
1654 double complex tmp_J,
1656 double complex *tmp_v0,
1657 double complex *tmp_v1
1660 unsigned long int tmp_off, off, j, idim_max_buf;
1662 double complex tmp_V, dmv, dam_pr;
1663 MPI_Status statusMPI;
1680 if(ihermite==
FALSE){
1685 tmp_V = conj(tmp_J);
1686 if(
X->Large.mode == M_CORR||
X->Large.mode == M_CALCSPEC){
1698 ierr = MPI_Sendrecv(&
X->Check.idim_max, 1, MPI_UNSIGNED_LONG, origin, 0,
1699 &idim_max_buf, 1, MPI_UNSIGNED_LONG, origin, 0,
1700 MPI_COMM_WORLD, &statusMPI);
1702 ierr = MPI_Sendrecv(
list_1,
X->Check.idim_max + 1, MPI_UNSIGNED_LONG, origin, 0,
1703 list_1buf, idim_max_buf + 1, MPI_UNSIGNED_LONG, origin, 0,
1704 MPI_COMM_WORLD, &statusMPI);
1706 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1707 v1buf, idim_max_buf + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1708 MPI_COMM_WORLD, &statusMPI);
1712 #pragma omp parallel default(none) reduction(+:dam_pr) firstprivate(X, tmp_V, idim_max_buf) \ 1713 private(j, dmv, off) shared (tmp_v0, tmp_v1, list_1buf, v1buf) 1715 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
1717 for (j = 1; j <= idim_max_buf; j++) {
1719 dmv =
v1buf[j] * tmp_V;
1721 dam_pr += conj(tmp_v1[off]) * dmv;
1726 for (j = 1; j <= idim_max_buf; j++) {
1728 dmv =
v1buf[j] * tmp_V;
1729 dam_pr += conj(tmp_v1[off]) * dmv;
1748 double complex tmp_J,
1750 double complex *tmp_v0,
1751 double complex *tmp_v1
1754 unsigned long int j, num1;
1755 double complex tmp_V, dmv, dam_pr;
1757 if (org_isite1 == org_isite3 && org_ispin1 == org_ispin3) {
1758 num1 =
BitCheckGeneral((
unsigned long int)
myrank, org_isite1 + 1, org_ispin1,
X->Def.SiteToBit,
X->Def.Tpow);
1759 if (num1 !=
FALSE) {
1767 num1 =
BitCheckGeneral((
unsigned long int)
myrank, org_isite1 + 1, org_ispin1,
X->Def.SiteToBit,
X->Def.Tpow);
1768 if (num1 !=
FALSE) {
1771 if (num1 !=
FALSE) {
1783 #pragma omp parallel default(none) reduction(+:dam_pr) firstprivate(X, tmp_V) private(j, dmv) \ 1784 shared (tmp_v0, tmp_v1) 1786 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
1788 for (j = 1; j <=
X->Check.idim_max; j++) {
1789 dmv = tmp_v1[j] * tmp_V;
1791 dam_pr += conj(tmp_v1[j]) * dmv;
1796 for (j = 1; j <=
X->Check.idim_max; j++) {
1797 dmv = tmp_v1[j] * tmp_V;
1798 dam_pr += conj(tmp_v1[j]) * dmv;
1817 double complex tmp_J,
1819 double complex *tmp_v0,
1820 double complex *tmp_v1
1824 unsigned long int j, num1;
1825 double complex tmp_V, dmv, dam_pr;
1828 num1 =
BitCheckGeneral((
unsigned long int)
myrank, org_isite3 + 1, org_ispin3,
X->Def.SiteToBit,
X->Def.Tpow);
1829 if (num1 !=
FALSE) {
1835 #pragma omp parallel default(none) reduction(+:dam_pr) \ 1836 firstprivate(X, tmp_V, org_isite1, org_ispin1) private(j, dmv, num1) shared (tmp_v0, tmp_v1, list_1) 1838 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
1840 for (j = 1; j <=
X->Check.idim_max; j++) {
1843 dmv = tmp_v1[j] * tmp_V * num1;
1845 dam_pr += conj(tmp_v1[j]) * dmv;
1850 for (j = 1; j <=
X->Check.idim_max; j++) {
1853 dmv = tmp_v1[j] * tmp_V * num1;
1854 dam_pr += conj(tmp_v1[j]) * dmv;
1875 double complex tmp_J,
1877 double complex *tmp_v0,
1878 double complex *tmp_v1
1881 unsigned long int tmp_off, off, j, idim_max_buf;
1882 int origin, ierr, isite, IniSpin, FinSpin;
1883 double complex tmp_V, dmv, dam_pr;
1884 MPI_Status statusMPI;
1887 org_isite3 + 1, org_ispin3, org_ispin4, &off,
1888 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE)
1891 isite = org_isite1 + 1;
1892 IniSpin = org_ispin2;
1893 FinSpin = org_ispin1;
1896 org_isite3 + 1, org_ispin4, org_ispin3, &off,
X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE)
1898 tmp_V = conj(tmp_J);
1899 if (
X->Large.mode == M_CORR ||
X->Large.mode == M_CALCSPEC) tmp_V = 0.0;
1900 isite = org_isite1 + 1;
1901 IniSpin = org_ispin1;
1902 FinSpin = org_ispin2;
1908 ierr = MPI_Sendrecv(&
X->Check.idim_max, 1, MPI_UNSIGNED_LONG, origin, 0,
1909 &idim_max_buf, 1, MPI_UNSIGNED_LONG, origin, 0,
1910 MPI_COMM_WORLD, &statusMPI);
1912 ierr = MPI_Sendrecv(
list_1,
X->Check.idim_max + 1, MPI_UNSIGNED_LONG, origin, 0,
1913 list_1buf, idim_max_buf + 1, MPI_UNSIGNED_LONG, origin, 0,
1914 MPI_COMM_WORLD, &statusMPI);
1916 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1917 v1buf, idim_max_buf + 1, MPI_DOUBLE_COMPLEX, origin, 0,
1918 MPI_COMM_WORLD, &statusMPI);
1922 #pragma omp parallel default(none) reduction(+:dam_pr) \ 1923 firstprivate(X, tmp_V, idim_max_buf, IniSpin, FinSpin, isite) \ 1924 private(j, dmv, off, tmp_off) shared (tmp_v0, tmp_v1, list_1buf, v1buf) 1926 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
1928 for (j = 1; j <= idim_max_buf; j++) {
1931 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE)
1934 dmv =
v1buf[j] * tmp_V;
1936 dam_pr += conj(tmp_v1[off]) * dmv;
1942 for (j = 1; j <= idim_max_buf; j++) {
1945 X->Def.SiteToBit,
X->Def.Tpow) ==
TRUE)
1948 dmv =
v1buf[j] * tmp_V;
1949 dam_pr += conj(tmp_v1[off]) * dmv;
1969 double complex tmp_trans,
1971 double complex *tmp_v0 ,
1972 double complex *tmp_v1 )
1975 int mask1, state1, ierr, origin;
1976 unsigned long int idim_max_buf, j;
1977 MPI_Status statusMPI;
1978 double complex trans, dmv, dam_pr;
1980 mask1 = (int)
X->Def.Tpow[org_isite1];
1982 state1 = (origin & mask1)/mask1;
1986 if(state1 == org_ispin2){
1989 else if(state1 == org_ispin1) {
1990 trans = conj(tmp_trans);
1991 if(
X->Large.mode == M_CORR||
X->Large.mode ==M_CALCSPEC){
1999 ierr = MPI_Sendrecv(&
X->Check.idim_max, 1, MPI_UNSIGNED_LONG, origin, 0,
2000 &idim_max_buf, 1, MPI_UNSIGNED_LONG, origin, 0,
2001 MPI_COMM_WORLD, &statusMPI);
2003 ierr = MPI_Sendrecv(tmp_v1,
X->Check.idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
2004 v1buf, idim_max_buf + 1, MPI_DOUBLE_COMPLEX, origin, 0,
2005 MPI_COMM_WORLD, &statusMPI);
2009 #pragma omp parallel default(none) reduction(+:dam_pr) private(j, dmv) \ 2010 firstprivate(idim_max_buf, trans, X) shared(v1buf, tmp_v1, tmp_v0) 2012 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
2014 for (j = 1; j <=
X->Check.idim_max; j++) {
2015 dmv = trans *
v1buf[j];
2017 dam_pr += conj(tmp_v1[j]) * dmv;
2022 for (j = 1; j <=
X->Check.idim_max; j++) {
2023 dmv = trans *
v1buf[j];
2024 dam_pr += conj(tmp_v1[j]) * dmv;
2042 double complex tmp_trans,
2044 double complex *tmp_v0 ,
2045 double complex *tmp_v1,
2046 double complex *tmp_v1buf,
2047 unsigned long int idim_max,
2048 long unsigned int *Tpow,
2051 long unsigned int *list_2_1_target,
2052 long unsigned int *list_2_2_target,
2053 long unsigned int _irght,
2054 long unsigned int _ilft,
2055 long unsigned int _ihfbit
2058 int mask1, state1, ierr, origin;
2059 unsigned long int idim_max_buf, j;
2060 unsigned long int tmp_off;
2061 MPI_Status statusMPI;
2062 double complex trans, dmv;
2064 mask1 = (int)
X->Def.Tpow[org_isite1];
2066 state1 = (origin & mask1)/mask1;
2068 if(state1 == org_ispin2){
2077 ierr = MPI_Sendrecv(&idim_max, 1, MPI_UNSIGNED_LONG, origin, 0,
2078 &idim_max_buf, 1, MPI_UNSIGNED_LONG, origin, 0,
2079 MPI_COMM_WORLD, &statusMPI);
2082 ierr = MPI_Sendrecv(
list_1_org, idim_max + 1, MPI_UNSIGNED_LONG, origin, 0,
2083 list_1buf_org, idim_max_buf + 1, MPI_UNSIGNED_LONG, origin, 0,
2084 MPI_COMM_WORLD, &statusMPI);
2087 ierr = MPI_Sendrecv(tmp_v1, idim_max + 1, MPI_DOUBLE_COMPLEX, origin, 0,
2088 v1buf, idim_max_buf + 1, MPI_DOUBLE_COMPLEX, origin, 0,
2089 MPI_COMM_WORLD, &statusMPI);
2092 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
2093 #pragma omp parallel for default(none) private(j, dmv, tmp_off) \ 2094 firstprivate(idim_max_buf, trans, X, list_1buf_org, list_2_1_target, list_2_2_target) \ 2095 shared(v1buf, tmp_v0) 2096 for (j = 1; j <= idim_max_buf; j++) {
2098 dmv = trans *
v1buf[j];
2099 tmp_v0[tmp_off] += dmv;
2120 double complex tmp_trans,
2122 double complex *tmp_v0 ,
2123 double complex *tmp_v1
2126 long unsigned int j;
2129 double complex dam_pr;
2130 mask1 = (int)
X->Def.Tpow[org_isite1];
2131 ibit1 = (((
unsigned long int)
myrank& mask1)/mask1)^(1-org_ispin1);
2134 #pragma omp parallel reduction(+:dam_pr)default(none) shared(tmp_v1, tmp_v0, ibit1) \ 2135 firstprivate(X, tmp_trans) private(j) 2138 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
2140 for (j = 1; j <=
X->Check.idim_max; j++) {
2141 tmp_v0[j] += tmp_v1[j] * tmp_trans;
2142 dam_pr += tmp_trans * conj(tmp_v1[j]) * tmp_v1[j];
2147 for (j = 1; j <=
X->Check.idim_max; j++) {
2148 dam_pr += tmp_trans * conj(tmp_v1[j]) * tmp_v1[j];
2167 double complex tmp_trans,
2169 double complex *tmp_v0 ,
2170 double complex *tmp_v1
2173 long unsigned int j;
2176 double complex dam_pr;
2177 mask1 = (int)
X->Def.Tpow[org_isite1];
2178 ibit1 = (((
unsigned long int)
myrank& mask1) / mask1) ^ (1 - org_ispin1);
2181 #pragma omp parallel reduction(+:dam_pr)default(none) shared(tmp_v1, tmp_v0, ibit1) \ 2182 firstprivate(X, tmp_trans) private(j) 2185 if (
X->Large.mode == M_MLTPLY ||
X->Large.mode == M_CALCSPEC) {
2187 for (j = 1; j <=
X->Check.idim_max; j++) {
2188 tmp_v0[j] += tmp_v1[j] * tmp_trans;
2189 dam_pr += tmp_trans * conj(tmp_v1[j]) * tmp_v1[j];
2194 for (j = 1; j <=
X->Check.idim_max; j++) {
2195 dam_pr += tmp_trans * conj(tmp_v1[j]) * tmp_v1[j];
void GC_child_CisAitCiuAiv_spin_MPIdouble(unsigned long int i_int, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Exchange and Pairlifting term in Spin model + GC When both site1 and site2 are in the inter process r...
void exitMPI(int errorcode)
MPI abort wrapper.
double complex X_child_CisAitCjuAjv_GeneralSpin_MPIsingle(int org_isite1, int org_ispin1, int org_ispin2, int org_isite3, int org_ispin3, int org_ispin4, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Compute term in the canonical general spin system when one of these sites is in the inter process re...
double complex X_GC_child_CisAisCjuAju_spin_MPIdouble(int org_isite1, int org_ispin1, int org_isite3, int org_ispin3, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
CisAisCjuAju term in Spin model + GC When both site1 and site3 are in the inter process region...
double complex X_GC_child_CisAitCjuAjv_GeneralSpin_MPIsingle(int org_isite1, int org_ispin1, int org_ispin2, int org_isite3, int org_ispin3, int org_ispin4, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Compute term in the grandcanonical general spin system when one of these site is in the inter proces...
double complex X_GC_child_CisAisCjuAjv_GeneralSpin_MPIdouble(int org_isite1, int org_ispin1, int org_isite3, int org_ispin3, int org_ispin4, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
term in Spin model. When both site1 and site3 are in the inter process region.
void GC_child_CisAitCiuAiv_spin_MPIsingle(unsigned long int i_int, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Exchange and Pairlifting term in Spin model + GC When only site2 is in the inter process region...
double complex X_GC_child_CisAis_GeneralSpin_MPIdouble(int org_isite1, int org_ispin1, double complex tmp_trans, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Compute term in the grandcanonical general spin system when both site is in the inter process region...
double complex X_GC_child_CisAis_spin_MPIdouble(int org_isite1, int org_ispin1, double complex tmp_trans, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Hopping term in Spin + GC When both site1 and site2 are in the inter process region.
double complex X_GC_child_CisAitCjuAju_GeneralSpin_MPIsingle(int org_isite1, int org_ispin1, int org_ispin2, int org_isite3, int org_ispin3, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Compute term in the grandcanonical general spin system when one of these site is in the inter proces...
double complex X_GC_child_CisAitCiuAiv_spin_MPIsingle(int org_isite1, int org_ispin1, int org_ispin2, int org_isite3, int org_ispin3, int org_ispin4, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Exchange and Pairlifting term in Spin model + GC When only site2 is in the inter process region...
double complex X_GC_child_CisAit_spin_MPIdouble(int org_isite1, int org_ispin1, int org_ispin2, double complex tmp_trans, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Hopping term in Spin + GC When both site1 and site2 are in the inter process region.
double complex X_child_CisAisCjuAju_GeneralSpin_MPIsingle(int org_isite1, int org_ispin1, int org_isite3, int org_ispin3, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Compute term in the canonical general spin system when one of these sites is in the inter process re...
int X_SpinGC_CisAis(long unsigned int j, struct BindStruct *X, long unsigned int is1_spin, long unsigned int sigma1)
Compute the grandcanonical spin state with bit mask is1_spin.
long unsigned int * list_1buf
double complex X_child_CisAisCjuAju_GeneralSpin_MPIdouble(int org_isite1, int org_ispin1, int org_isite3, int org_ispin3, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Compute term in the canonical general spin system when both sites are in the inter process region...
void GC_child_CisAisCjuAjv_spin_MPIsingle(unsigned long int i_int, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Wrapper for CisAisCjuAjv term in Spin model + GC When only site2 is in the inter process region...
int ConvertToList1GeneralSpin(const long unsigned int org_ibit, const long unsigned int ihlfbit, long unsigned int *_ilist1Comp)
function of converting component to list_1
void GC_child_CisAisCjuAjv_spin_MPIdouble(unsigned long int i_int, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Wrapper for calculating CisAisCjuAjv term in Spin model + GC When both site1 and site2 are in the int...
double complex X_child_CisAitCjuAjv_GeneralSpin_MPIdouble(int org_isite1, int org_ispin1, int org_ispin2, int org_isite3, int org_ispin3, int org_ispin4, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Compute term in the canonical general spin system when both sites are in the inter process region...
double complex X_GC_child_CisAisCjuAju_GeneralSpin_MPIdouble(int org_isite1, int org_ispin1, int org_isite3, int org_ispin3, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Compute term in the grandcanonical general spin system when both site is in the inter process region...
double complex X_GC_child_CisAisCjuAju_spin_MPIsingle(int org_isite1, int org_ispin1, int org_isite3, int org_ispin3, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
CisAisCjuAjv term in Spin model + GC When both site1 and site2 are in the inter process region...
double complex X_GC_child_CisAitCjuAjv_GeneralSpin_MPIdouble(int org_isite1, int org_ispin1, int org_ispin2, int org_isite3, int org_ispin3, int org_ispin4, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Compute term in the grandcanonical general spin system when both site is in the inter process region...
long unsigned int * list_1buf_org
double complex X_GC_child_CisAitCjuAju_spin_MPIsingle(int org_isite1, int org_ispin1, int org_ispin2, int org_isite3, int org_ispin3, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
CisAisCjuAjv term in Spin model + GC When only site2 is in the inter process region.
double complex X_GC_child_CisAisCjuAjv_spin_MPIdouble(int org_isite1, int org_ispin1, int org_isite3, int org_ispin3, int org_ispin4, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
CisAisCjuAjv term in Spin model + GC When both site1 and site2 are in the inter process region...
double complex X_GC_child_CisAit_GeneralSpin_MPIdouble(int org_isite1, int org_ispin1, int org_ispin2, double complex tmp_trans, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Compute term in the grandcanonical general spin system when both site is in the inter process region...
double complex X_child_CisAit_spin_MPIdouble(int org_isite1, int org_ispin2, double complex tmp_trans, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1, double complex *tmp_v1buf, unsigned long int idim_max, long unsigned int *Tpow, long unsigned int *list_1_org, long unsigned int *list_1buf_org, long unsigned int *list_2_1_target, long unsigned int *list_2_2_target, long unsigned int _irght, long unsigned int _ilft, long unsigned int _ihfbit)
Hopping term in Spin + Canonical for CalcSpectrum When both site1 and site2 are in the inter process ...
void GC_child_CisAitCjuAju_spin_MPIsingle(unsigned long int i_int, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Wrapper for CisAitCjuAju term in Spin model + GC When only site2 is in the inter process region...
long unsigned int * list_1_org
int GetOffComp(long unsigned int *_list_2_1, long unsigned int *_list_2_2, long unsigned int _ibit, const long unsigned int _irght, const long unsigned int _ilft, const long unsigned int _ihfbit, long unsigned int *_ioffComp)
function of getting off-diagonal component
long unsigned int * list_1
void GC_child_CisAitCjuAju_spin_MPIdouble(unsigned long int i_int, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Wrapper for calculating CisAitCjuAju term in Spin model + GC When both site1 and site2 are in the int...
double complex X_GC_child_AisCis_GeneralSpin_MPIdouble(int org_isite1, int org_ispin1, double complex tmp_trans, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Compute term in the grandcanonical general spin system when both site is in the inter process region...
int BitCheckGeneral(const long unsigned int org_bit, const unsigned int org_isite, const unsigned int target_ispin, const long int *SiteToBit, const long unsigned int *Tpow)
bit check function for general spin
double complex X_GC_child_AisCis_spin_MPIdouble(int org_isite1, int org_ispin1, double complex tmp_trans, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Hopping term in Spin + GC When both site1 and site2 are in the inter process region.
double complex X_GC_child_CisAitCjuAju_GeneralSpin_MPIdouble(int org_isite1, int org_ispin1, int org_ispin2, int org_isite3, int org_ispin3, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
term in Spin model. When both site1 and site3 are in the inter process region.
double complex X_child_CisAit_GeneralSpin_MPIdouble(int org_isite1, int org_ispin1, int org_ispin2, double complex tmp_trans, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1, double complex *tmp_v1buf, unsigned long int idim_max, long unsigned int *list_1_org, long unsigned int *list_1buf_org, long unsigned int _ihfbit)
Compute term in the canonical general spin system when both site is in the inter process region...
double complex X_GC_child_CisAisCjuAjv_GeneralSpin_MPIsingle(int org_isite1, int org_ispin1, int org_isite3, int org_ispin3, int org_ispin4, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Compute term in the grandcanonical general spin system when one of these site is in the inter proces...
double complex X_GC_child_CisAisCjuAjv_spin_MPIsingle(int org_isite1, int org_ispin1, int org_isite3, int org_ispin3, int org_ispin4, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
CisAisCjuAjv term in Spin model + GC When only site2 is in the inter process region.
int GetOffCompGeneralSpin(const long unsigned int org_ibit, const int org_isite, const int org_ispin, const int off_ispin, long unsigned int *_ioffComp, const long int *SiteToBit, const long unsigned int *Tpow)
function of getting off-diagonal component for general spin
int X_SpinGC_CisAit(long unsigned int j, struct BindStruct *X, long unsigned int is1_spin, long unsigned int sigma2, long unsigned int *tmp_off)
Compute index of final wavefunction by term (grandcanonical).
int myrank
Process ID, defined in InitializeMPI()
double complex X_GC_child_CisAitCiuAiv_spin_MPIdouble(int org_isite1, int org_ispin1, int org_ispin2, int org_isite3, int org_ispin3, int org_ispin4, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
term in Spin model + GC. When both site1 and site2 are in the inter process region.
double complex X_GC_child_CisAitCjuAju_spin_MPIdouble(int org_isite1, int org_ispin1, int org_ispin2, int org_isite3, int org_ispin3, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
CisAisCjuAjv term in Spin model + GC When both site1 and site2 are in the inter process region...
double complex X_GC_child_CisAisCjuAju_GeneralSpin_MPIsingle(int org_isite1, int org_ispin1, int org_isite3, int org_ispin3, double complex tmp_J, struct BindStruct *X, double complex *tmp_v0, double complex *tmp_v1)
Compute term in the grandcanonical general spin system when one of these site is in the inter proces...