Context Navigation

perturbed.c@ 88e890

Visit:

Last change on this file since 88e890 was f5586e, checked in by Frederik Heber <heber@…>, 17 years ago

RealBasisQ[] removed

RealBasisQ[] is again replaced by sqrt(RealBasisSQ[]) as we are going to switch to a pure matrix transformation for calculating whether points are still within the periodic cell and so forth instead of "hoping" the simulation box is rectangular.

Property mode set to 100644

File size: 203.0 KB

Rev	Line
[a0bcf1]	1	/** \file perturbed.c
	2	* Perturbation calculation due to external magnetic field.
	3	*
	4	* Central function is MinimisePerturbed() wherein the actual minimisation of the two different operators with each
	5	* three components takes place subsequently. Helpful routines are CalculatePerturbationOperator_P() - which applies a
	6	* specified component of p on the current wave function - and CalculatePerturbationOperator_RxP() - which does the
	7	* same for the RxP operator.
	8	* The actual minimisation loop FindPerturbedMinimum() depends on the same routines also used for the occupied orbitals,
	9	* however with a different energy functional and derivatives, evaluated in Calculate1stPerturbedDerivative() and
	10	* Calculate2ndPerturbedDerivative(). InitPerturbedEnergyCalculation() calculates the total energy functional
	11	* perturbed in second order for all wave functions, UpdatePerturbedEnergyCalculation() just updates the one
	12	* for the wave function after it has been minimised during the line search. Both use CalculatePerturbedEnergy() which
	13	* evaluates the energy functional (and the gradient if specified).
	14	* Finally, FillCurrentDensity() evaluates the current density at a given point in space using the perturbed
	15	* wave functions. Afterwards by calling CalculateMagneticSusceptibility() or
	16	* CalculateChemicalShieldingByReciprocalCurrentDensity() susceptibility respectively shielding tensor are possible uses
	17	* of this current density.
	18	*
	19	* There are also some test routines: TestCurrent() checks whether the integrated current is zero in each component.
	20	* test_fft_symmetry() tests the "pulling out imaginary unit" before fourier transformation on a given wave function.
	21	* CheckOrbitalOverlap() outputs the overlap matrix for the wave functions of a given minimisation state, this might
	22	* be important for the additional \f$\Delta J{ij}\f$ contribution to the current density, which is non-zero for
	23	* non-zero mutual overlap, which is evaluated if FillDeltaCurrentDensity() is called.
	24	*
	25	* Finally, there are also some smaller routines: truedist() gives the correct relative distance between two points
	26	* in the unit cell under periodic boundary conditions with minimum image convention. ApplyTotalHamiltonian() returns
	27	* the hamiltonian applied to a given wave function. sawtooth() is a sawtooth implementation which is needed in order
	28	* to avoid flipping of position eigenvalues for nodes close to or on the cell boundary. CalculateOverlap()
	29	* is used in the energy functional derivatives, keeping an overlap table between perturbed wave functions up to date.
	30	* fft_Psi() is very similar to CalculateOneDensityR(), it does the extension of the wave function to the upper level
	31	* RunStruct#Lev0 while fouriertransforming it to real space. cross() gives correct indices in evaluating a vector cross
	32	* product. AllocCurrentDensity() and DisAllocCurrentDensity() mark the current density arrays as currently being in use or not.
	33	*
	34	Project: ParallelCarParrinello
	35	\author Frederik Heber
	36	\date 2006
	37
	38	*/
	39
	40	#include <stdlib.h>
	41	#include <stdio.h>
	42	#include <math.h>
	43	#include <string.h>
	44	#include <time.h>
	45	#include <gsl/gsl_matrix.h>
	46	#include <gsl/gsl_eigen.h>
	47	#include <gsl/gsl_complex.h>
	48	#include <gsl/gsl_complex_math.h>
	49	#include <gsl/gsl_sort_vector.h>
	50	#include <gsl/gsl_linalg.h>
	51	#include <gsl/gsl_multimin.h>
	52
	53	#include "data.h"
	54	#include "density.h"
	55	#include "energy.h"
	56	#include "excor.h"
	57	#include "errors.h"
	58	#include "grad.h"
	59	#include "gramsch.h"
	60	#include "mergesort2.h"
	61	#include "helpers.h"
	62	#include "init.h"
	63	#include "myfft.h"
	64	#include "mymath.h"
	65	#include "output.h"
	66	#include "pcp.h"
	67	#include "perturbed.h"
	68	#include "run.h"
	69	#include "wannier.h"
	70
	71	/** evaluates perturbed energy functional.
	72	* \param norm norm of current Psi in functional
	73	* \param *params void-pointer to parameter array
	74	* \return evaluated functional at f(x) with \a norm
	75	*/
	76	double perturbed_function (double norm, void *params) {
	77	struct Problem P = (struct Problem )params;
	78	int i, n = P->R.LevS->MaxG;
	79	double old_norm = GramSchGetNorm2(P,P->R.LevS,P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo]);
	80	fftw_complex *currentPsi = P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo];
	81	fprintf(stderr,"(%i) perturbed_function: setting norm to %lg ...", P->Par.me, norm);
	82	// set desired norm for current Psi
	83	for (i=0; i< n; i++) {
	84	currentPsi[i].re *= norm/old_norm; // real part
	85	currentPsi[i].im *= norm/old_norm; // imaginary part
	86	}
	87	P->R.PsiStep = 0; // make it not advance to next Psi
	88
	89	//debug(P,"UpdateActualPsiNo");
	90	UpdateActualPsiNo(P, P->R.CurrentMin); // orthogonalize
	91	//debug(P,"UpdateEnergyArray");
	92	UpdateEnergyArray(P); // shift energy values in their array by one
	93	//debug(P,"UpdatePerturbedEnergyCalculation");
	94	UpdatePerturbedEnergyCalculation(P); // re-calc energies (which is hopefully lower)
	95	EnergyAllReduce(P); // gather from all processes and sum up to total energy
	96	/*
	97	for (i=0; i< n; i++) {
	98	currentPsi[i].re /= norm/old_norm; // real part
	99	currentPsi[i].im /= norm/old_norm; // imaginary part
	100	}*/
	101
	102	fprintf(stderr,"%lg\n", P->Lat.E->TotalEnergy[0]);
	103	return P->Lat.E->TotalEnergy[0]; // and return evaluated functional
	104	}
	105
	106	/** evaluates perturbed energy functional.
	107	* \param *x current position in functional
	108	* \param *params void-pointer to parameter array
	109	* \return evaluated functional at f(x)
	110	*/
	111	double perturbed_f (const gsl_vector x, void params) {
	112	struct Problem P = (struct Problem )params;
	113	int i, n = P->R.LevS->MaxG*2;
	114	fftw_complex *currentPsi = P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo];
	115	//int diff = 0;
	116	//debug(P,"f");
	117	// put x into current Psi
	118	for (i=0; i< n; i+=2) {
	119	//if ((currentPsi[i/2].re != gsl_vector_get (x, i)) \|\| (currentPsi[i/2].im != gsl_vector_get (x, i+1))) diff++;
	120	currentPsi[i/2].re = gsl_vector_get (x, i); // real part
	121	currentPsi[i/2].im = gsl_vector_get (x, i+1); // imaginary part
	122	}
	123	//if (diff) fprintf(stderr,"(%i) %i differences between old and new currentPsi.\n", P->Par.me, diff);
	124	P->R.PsiStep = 0; // make it not advance to next Psi
	125
	126	//debug(P,"UpdateActualPsiNo");
	127	UpdateActualPsiNo(P, P->R.CurrentMin); // orthogonalize
	128	//debug(P,"UpdateEnergyArray");
	129	UpdateEnergyArray(P); // shift energy values in their array by one
	130	//debug(P,"UpdatePerturbedEnergyCalculation");
	131	UpdatePerturbedEnergyCalculation(P); // re-calc energies (which is hopefully lower)
	132	EnergyAllReduce(P); // gather from all processes and sum up to total energy
	133
	134	return P->Lat.E->TotalEnergy[0]; // and return evaluated functional
	135	}
	136
	137	/** evaluates perturbed energy gradient.
	138	* \param *x current position in functional
	139	* \param *params void-pointer to parameter array
	140	* \param *g array for gradient vector on return
	141	*/
	142	void perturbed_df (const gsl_vector x, void params, gsl_vector *g) {
	143	struct Problem P = (struct Problem )params;
	144	int i, n = P->R.LevS->MaxG*2;
	145	fftw_complex *currentPsi = P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo];
	146	fftw_complex *gradient = P->Grad.GradientArray[ActualGradient];
	147	//int diff = 0;
	148	//debug(P,"df");
	149	// put x into current Psi
	150	for (i=0; i< n; i+=2) {
	151	//if ((currentPsi[i/2].re != gsl_vector_get (x, i)) \|\| (currentPsi[i/2].im != gsl_vector_get (x, i+1))) diff++;
	152	currentPsi[i/2].re = gsl_vector_get (x, i); // real part
	153	currentPsi[i/2].im = gsl_vector_get (x, i+1); // imaginary part
	154	}
	155	//if (diff) fprintf(stderr,"(%i) %i differences between old and new currentPsi.\n", P->Par.me, diff);
	156	P->R.PsiStep = 0; // make it not advance to next Psi
	157
	158	//debug(P,"UpdateActualPsiNo");
	159	UpdateActualPsiNo(P, P->R.CurrentMin); // orthogonalize
	160	//debug(P,"UpdateEnergyArray");
	161	UpdateEnergyArray(P); // shift energy values in their array by one
	162	//debug(P,"UpdatePerturbedEnergyCalculation");
	163	UpdatePerturbedEnergyCalculation(P); // re-calc energies (which is hopefully lower)
	164	EnergyAllReduce(P); // gather from all processes and sum up to total energy
	165
	166	// checkout gradient
	167	//diff = 0;
	168	for (i=0; i< n; i+=2) {
	169	//if ((-gradient[i/2].re != gsl_vector_get (g, i)) \|\| (-gradient[i/2].im != gsl_vector_get (g, i+1))) diff++;
	170	gsl_vector_set (g, i, -gradient[i/2].re); // real part
	171	gsl_vector_set (g, i+1, -gradient[i/2].im); // imaginary part
	172	}
	173	//if (diff) fprintf(stderr,"(%i) %i differences between old and new gradient.\n", P->Par.me, diff);
	174	}
	175
	176	/** evaluates perturbed energy functional and gradient.
	177	* \param *x current position in functional
	178	* \param *params void-pointer to parameter array
	179	* \param *f pointer to energy function value on return
	180	* \param *g array for gradient vector on return
	181	*/
	182	void perturbed_fdf (const gsl_vector x, void params, double f, gsl_vector g) {
	183	struct Problem P = (struct Problem )params;
	184	int i, n = P->R.LevS->MaxG*2;
	185	fftw_complex *currentPsi = P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo];
	186	fftw_complex *gradient = P->Grad.GradientArray[ActualGradient];
	187	//int diff = 0;
	188	//debug(P,"fdf");
	189	// put x into current Psi
	190	for (i=0; i< n; i+=2) {
	191	//if ((currentPsi[i/2].re != gsl_vector_get (x, i)) \|\| (currentPsi[i/2].im != gsl_vector_get (x, i+1))) diff++;
	192	currentPsi[i/2].re = gsl_vector_get (x, i); // real part
	193	currentPsi[i/2].im = gsl_vector_get (x, i+1); // imaginary part
	194	}
	195	//if (diff) fprintf(stderr,"(%i) %i differences between old and new currentPsi.\n", P->Par.me, diff);
	196	P->R.PsiStep = 0; // make it not advance to next Psi
	197
	198	//debug(P,"UpdateActualPsiNo");
	199	UpdateActualPsiNo(P, P->R.CurrentMin); // orthogonalize
	200	//debug(P,"UpdateEnergyArray");
	201	UpdateEnergyArray(P); // shift energy values in their array by one
	202	//debug(P,"UpdatePerturbedEnergyCalculation");
	203	UpdatePerturbedEnergyCalculation(P); // re-calc energies (which is hopefully lower)
	204	EnergyAllReduce(P); // gather from all processes and sum up to total energy
	205
	206	// checkout gradient
	207	//diff = 0;
	208	for (i=0; i< n; i+=2) {
	209	//if ((-gradient[i/2].re != gsl_vector_get (g, i)) \|\| (-gradient[i/2].im != gsl_vector_get (g, i+1))) diff++;
	210	gsl_vector_set (g, i, -gradient[i/2].re); // real part
	211	gsl_vector_set (g, i+1, -gradient[i/2].im); // imaginary part
	212	}
	213	//if (diff) fprintf(stderr,"(%i) %i differences between old and new gradient.\n", P->Par.me, diff);
	214
	215	*f = P->Lat.E->TotalEnergy[0]; // and return evaluated functional
	216	}
	217
	218	/** Minimisation of the PsiTypeTag#Perturbed_RxP0, PsiTypeTag#Perturbed_P0 and other orbitals.
	219	* For each of the above PsiTypeTag we go through the following before the minimisation loop:
	220	* -# ResetGramSchTagType() resets current type that is to be minimised to NotOrthogonal.
	221	* -# UpdateActualPsiNo() steps on to next perturbed of current PsiTypeTag type.
	222	* -# GramSch() orthonormalizes perturbed wave functions.
	223	* -# TestGramSch() tests if orthonormality was achieved.
	224	* -# InitDensityCalculation() gathers densities from all wave functions (and all processes), within SpeedMeasure() DensityTime.
	225	* -# InitPerturbedEnergyCalculation() performs initial calculation of the perturbed energy functional.
	226	* -# RunStruct#OldActualLocalPsiNo is set to RunStruct#ActualLocalPsiNo, immediately followed by UpdateGramSchOldActualPsiNo()
	227	* to bring info on all processes on par.
	228	* -# UpdatePerturbedEnergyCalculation() re-calculates Gradient and GradientTypes#H1cGradient for RunStruct#ActualLocalPsiNo
	229	* -# EnergyAllReduce() gathers various energy terms and sums up into Energy#TotalEnergy.
	230	*
	231	* And during the minimisation loop:
	232	* -# FindPerturbedMinimum() performs the gradient conjugation, the line search and wave function update.
	233	* -# UpdateActualPsiNo() steps on to the next wave function, orthonormalizing by GramSch() if necessary.
	234	* -# UpdateEnergyArray() shifts TotalEnergy values to make space for new one.
	235	* -# There is no density update as the energy function does not depend on the changing perturbed density but only on the fixed
	236	* unperturbed one.
	237	* -# UpdatePerturbedEnergyCalculation() re-calculates the perturbed energy of the changed wave function.
	238	* -# EnergyAllReduce() gathers energy terms and sums up.
	239	* -# CheckCPULIM() checks if external Stop signal has been given.
	240	* -# CalculateMinimumStop() checks whether we have dropped below a certain minimum change during minimisation of total energy.
	241	* -# finally step counters LatticeLevel#Step and SpeedStruct#Steps are increased.
	242	*
	243	* After the minimisation loop:
	244	* -# SetGramSchExtraPsi() removes extra Psis from orthogonaliy check.
	245	* -# ResetGramSchTagType() sets GramSchToDoType to NotUsedtoOrtho.
	246	*
	247	* And after all minimisation runs are done:
	248	* -# UpdateActualPsiNo() steps back to PsiTypeTag#Occupied type.
	249	*
	250	* At the end we return to Occupied wave functions.
	251	* \param *P at hand
	252	* \param *Stop flag to determine if epsilon stop conditions have met
	253	* \param *SuperStop flag to determinte whether external signal's required end of calculations
	254	*/
	255	void MinimisePerturbed (struct Problem P, int Stop, int *SuperStop) {
	256	struct RunStruct *R = &P->R;
	257	struct Lattice *Lat = &P->Lat;
	258	struct Psis *Psi = &Lat->Psi;
	259	int type;
	260	//int i;
	261
	262	// stuff for GSL minimization
	263	//size_t iter;
	264	//int status, Status
	265	int n = R->LevS->MaxG*2;
	266	const gsl_multimin_fdfminimizer_type *T_multi;
	267	const gsl_min_fminimizer_type *T;
	268	gsl_multimin_fdfminimizer *s_multi;
	269	gsl_min_fminimizer *s;
	270	gsl_vector x;//, ss;
	271	gsl_multimin_function_fdf my_func;
	272	gsl_function F;
	273	//fftw_complex *currentPsi;
	274	//double a,b,m, f_m, f_a, f_b;
	275	//double old_norm;
	276
	277	my_func.f = &perturbed_f;
	278	my_func.df = &perturbed_df;
	279	my_func.fdf = &perturbed_fdf;
	280	my_func.n = n;
	281	my_func.params = P;
	282	F.function = &perturbed_function;
	283	F.params = P;
	284
	285	x = gsl_vector_alloc (n);
	286	//ss = gsl_vector_alloc (Psi->NoOfPsis);
	287	T_multi = gsl_multimin_fdfminimizer_vector_bfgs;
	288	s_multi = gsl_multimin_fdfminimizer_alloc (T_multi, n);
	289	T = gsl_min_fminimizer_brent;
	290	s = gsl_min_fminimizer_alloc (T);
	291
	292	for (type=Perturbed_P0;type<=Perturbed_RxP2;type++) { // go through each perturbation group separately //
	293	*Stop=0; // reset stop flag
	294	fprintf(stderr,"(%i)Beginning perturbed minimisation of type %s ...\n", P->Par.me, R->MinimisationName[type]);
	295	//OutputOrbitalPositions(P, Occupied);
	296	R->PsiStep = R->MaxPsiStep; // reset in-Psi-minimisation-counter, so that we really advance to the next wave function
	297	UpdateActualPsiNo(P, type); // step on to next perturbed one
	298	fprintf(stderr, "(%i) Re-initializing perturbed psi array for type %s ", P->Par.me, R->MinimisationName[type]);
	299	if (P->Call.ReadSrcFiles && ReadSrcPsiDensity(P,type,1, R->LevSNo)) {
	300	SpeedMeasure(P, InitSimTime, StartTimeDo);
	301	fprintf(stderr,"from source file of recent calculation\n");
	302	ReadSrcPsiDensity(P,type, 0, R->LevSNo);
	303	ResetGramSchTagType(P, Psi, type, IsOrthogonal); // loaded values are orthonormal
	304	SpeedMeasure(P, DensityTime, StartTimeDo);
	305	//InitDensityCalculation(P);
	306	SpeedMeasure(P, DensityTime, StopTimeDo);
	307	R->OldActualLocalPsiNo = R->ActualLocalPsiNo; // needed otherwise called routines in function below crash
	308	UpdateGramSchOldActualPsiNo(P,Psi);
	309	InitPerturbedEnergyCalculation(P, 1); // go through all orbitals calculate each H^{(0)}-eigenvalue, recalc HGDensity, cause InitDensityCalc zero'd it
	310	UpdatePerturbedEnergyCalculation(P); // H1cGradient and Gradient must be current ones
	311	EnergyAllReduce(P); // gather energies for minimum search
	312	SpeedMeasure(P, InitSimTime, StopTimeDo);
	313	}
	314	if (P->Call.ReadSrcFiles != 1) {
	315	SpeedMeasure(P, InitSimTime, StartTimeDo);
	316	ResetGramSchTagType(P, Psi, type, NotOrthogonal); // perturbed now shall be orthonormalized
	317	if (P->Call.ReadSrcFiles != 2) {
	318	if (R->LevSNo == Lat->MaxLevel-1) { // is it the starting level? (see InitRunLevel())
	319	fprintf(stderr, "randomly.\n");
	320	InitPsisValue(P, Psi->TypeStartIndex[type], Psi->TypeStartIndex[type+1]); // initialize perturbed array for this run
	321	} else {
	322	fprintf(stderr, "from source file of last level.\n");
	323	ReadSrcPerturbedPsis(P, type);
	324	}
	325	}
	326	SpeedMeasure(P, InitGramSchTime, StartTimeDo);
	327	GramSch(P, R->LevS, Psi, Orthogonalize);
	328	SpeedMeasure(P, InitGramSchTime, StopTimeDo);
	329	SpeedMeasure(P, InitDensityTime, StartTimeDo);
	330	//InitDensityCalculation(P);
	331	SpeedMeasure(P, InitDensityTime, StopTimeDo);
	332	InitPerturbedEnergyCalculation(P, 1); // go through all orbitals calculate each H^{(0)}-eigenvalue, recalc HGDensity, cause InitDensityCalc zero'd it
	333	R->OldActualLocalPsiNo = R->ActualLocalPsiNo; // needed otherwise called routines in function below crash
	334	UpdateGramSchOldActualPsiNo(P,Psi);
	335	UpdatePerturbedEnergyCalculation(P); // H1cGradient and Gradient must be current ones
	336	EnergyAllReduce(P); // gather energies for minimum search
	337	SpeedMeasure(P, InitSimTime, StopTimeDo);
	338	R->LevS->Step++;
	339	EnergyOutput(P,0);
	340	while (*Stop != 1) {
	341	/* // copy current Psi into starting vector
	342	currentPsi = R->LevS->LPsi->LocalPsi[R->ActualLocalPsiNo];
	343	for (i=0; i< n; i+=2) {
	344	gsl_vector_set (x, i, currentPsi[i/2].re); // real part
	345	gsl_vector_set (x, i+1, currentPsi[i/2].im); // imaginary part
	346	}
	347	gsl_multimin_fdfminimizer_set (s_multi, &my_func, x, 0.01, 1e-2);
	348	iter = 0;
	349	status = 0;
	350	do { // look for minimum along current local psi
	351	iter++;
	352	status = gsl_multimin_fdfminimizer_iterate (s_multi);
	353	MPI_Allreduce(&status, &Status, 1, MPI_INT, MPI_MAX, P->Par.comm_ST_Psi);
	354	if (Status)
	355	break;
	356	status = gsl_multimin_test_gradient (s_multi->gradient, 1e-2);
	357	MPI_Allreduce(&status, &Status, 1, MPI_INT, MPI_MAX, P->Par.comm_ST_Psi);
	358	//if (Status == GSL_SUCCESS)
	359	//printf ("Minimum found at:\n");
	360	if (P->Par.me == 0) fprintf (stderr,"(%i,%i,%i)S(%i,%i,%i):\t %5d %10.5f\n",P->Par.my_color_comm_ST,P->Par.me_comm_ST, P->Par.me_comm_ST_PsiT, R->MinStep, R->ActualLocalPsiNo, R->PsiStep, (int)iter, s_multi->f);
	361	//TestGramSch(P,R->LevS,Psi, type); // functions are orthonormal?
	362	} while (Status == GSL_CONTINUE && iter < 3);
	363	/* // now minimize norm of currentPsi (one-dim)
	364	if (0) {
	365	iter = 0;
	366	status = 0;
	367	m = 1.;
	368	a = MYEPSILON;
	369	b = 100.;
	370	f_a = perturbed_function (a, P);
	371	f_b = perturbed_function (b, P);
	372	f_m = perturbed_function (m, P);
	373	//if ((f_m < f_a) && (f_m < f_b)) {
	374	gsl_min_fminimizer_set (s, &F, m, a, b);
	375	do { // look for minimum along current local psi
	376	iter++;
	377	status = gsl_min_fminimizer_iterate (s);
	378	m = gsl_min_fminimizer_x_minimum (s);
	379	a = gsl_min_fminimizer_x_lower (s);
	380	b = gsl_min_fminimizer_x_upper (s);
	381	status = gsl_min_test_interval (a, b, 0.001, 0.0);
	382	if (status == GSL_SUCCESS)
	383	printf ("Minimum found at:\n");
	384	printf ("%5d [%.7f, %.7f] %.7f %.7f\n",
	385	(int) iter, a, b,
	386	m, b - a);
	387	} while (status == GSL_CONTINUE && iter < 100);
	388	old_norm = GramSchGetNorm2(P,P->R.LevS,P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo]);
	389	for (i=0; i< n; i++) {
	390	currentPsi[i].re *= m/old_norm; // real part
	391	currentPsi[i].im *= m/old_norm; // imaginary part
	392	}
	393	} else debug(P,"Norm not minimizable!");*/
	394	//P->R.PsiStep = P->R.MaxPsiStep; // make it advance to next Psi
	395	FindPerturbedMinimum(P);
	396	//debug(P,"UpdateActualPsiNo");
	397	UpdateActualPsiNo(P, type); // step on to next perturbed Psi
	398	//debug(P,"UpdateEnergyArray");
	399	UpdateEnergyArray(P); // shift energy values in their array by one
	400	//debug(P,"UpdatePerturbedEnergyCalculation");
	401	UpdatePerturbedEnergyCalculation(P); // re-calc energies (which is hopefully lower)
	402	EnergyAllReduce(P); // gather from all processes and sum up to total energy
	403	//ControlNativeDensity(P); // check total density (summed up PertMixed must be zero!)
	404	//printf ("(%i,%i,%i)S(%i,%i,%i):\t %5d %10.5f\n",P->Par.my_color_comm_ST,P->Par.me_comm_ST, P->Par.me_comm_ST_PsiT, R->MinStep, R->ActualLocalPsiNo, R->PsiStep, (int)iter, s_multi->f);
	405	if (*SuperStop != 1)
	406	*SuperStop = CheckCPULIM(P);
	407	Stop = CalculateMinimumStop(P, SuperStop);
	408	P->Speed.Steps++; // step on
	409	R->LevS->Step++;
	410	}
	411	// now release normalization condition and minimize wrt to norm
	412	/* *Stop = 0;
	413	while (*Stop != 1) {
	414	currentPsi = R->LevS->LPsi->LocalPsi[R->ActualLocalPsiNo];
	415	iter = 0;
	416	status = 0;
	417	m = 1.;
	418	a = 0.001;
	419	b = 10.;
	420	f_a = perturbed_function (a, P);
	421	f_b = perturbed_function (b, P);
	422	f_m = perturbed_function (m, P);
	423	if ((f_m < f_a) && (f_m < f_b)) {
	424	gsl_min_fminimizer_set (s, &F, m, a, b);
	425	do { // look for minimum along current local psi
	426	iter++;
	427	status = gsl_min_fminimizer_iterate (s);
	428	m = gsl_min_fminimizer_x_minimum (s);
	429	a = gsl_min_fminimizer_x_lower (s);
	430	b = gsl_min_fminimizer_x_upper (s);
	431	status = gsl_min_test_interval (a, b, 0.001, 0.0);
	432	if (status == GSL_SUCCESS)
	433	printf ("Minimum found at:\n");
	434	printf ("%5d [%.7f, %.7f] %.7f %.7f\n",
	435	(int) iter, a, b,
	436	m, b - a);
	437	} while (status == GSL_CONTINUE && iter < 100);
	438	old_norm = GramSchGetNorm2(P,P->R.LevS,P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo]);
	439	for (i=0; i< n; i++) {
	440	currentPsi[i].re *= m/old_norm; // real part
	441	currentPsi[i].im *= m/old_norm; // imaginary part
	442	}
	443	}
	444	P->R.PsiStep = P->R.MaxPsiStep; // make it advance to next Psi
	445	//debug(P,"UpdateActualPsiNo");
	446	UpdateActualPsiNo(P, type); // step on to next perturbed Psi
	447	if (*SuperStop != 1)
	448	*SuperStop = CheckCPULIM(P);
	449	Stop = CalculateMinimumStop(P, SuperStop);
	450	P->Speed.Steps++; // step on
	451	R->LevS->Step++;
	452	}*/
	453	if(P->Call.out[NormalOut]) fprintf(stderr,"(%i) Write %s srcpsi to disk\n", P->Par.me, R->MinimisationName[type]);
	454	OutputSrcPsiDensity(P, type);
	455	// if (!TestReadnWriteSrcDensity(P,type))
	456	// Error(SomeError,"TestReadnWriteSrcDensity failed!");
	457	}
	458
	459	TestGramSch(P,R->LevS,Psi, type); // functions are orthonormal?
	460	// calculate current density summands
	461	//if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Filling current density grid ...\n",P->Par.me);
	462	SpeedMeasure(P, CurrDensTime, StartTimeDo);
	463	if (*SuperStop != 1) {
	464	if ((R->DoFullCurrent == 1) \|\| ((R->DoFullCurrent == 2) && (CheckOrbitalOverlap(P) == 1))) { //test to check whether orbitals have mutual overlap and thus \\DeltaJ_{xc} must not be dropped
	465	R->DoFullCurrent = 1; // set to 1 if it was 2 but Check...() yielded necessity
	466	//debug(P,"Filling with Delta j ...");
	467	//FillDeltaCurrentDensity(P);
	468	}// else
	469	//debug(P,"There is no overlap between orbitals.");
	470	//debug(P,"Filling with j ...");
	471	FillCurrentDensity(P);
	472	}
	473	SpeedMeasure(P, CurrDensTime, StopTimeDo);
	474
	475	SetGramSchExtraPsi(P,Psi,NotUsedToOrtho); // remove extra Psis from orthogonality check
	476	ResetGramSchTagType(P, Psi, type, NotUsedToOrtho); // remove this group from the check for the next minimisation group as well!
	477	}
	478	UpdateActualPsiNo(P, Occupied); // step on back to an occupied one
	479
	480	gsl_multimin_fdfminimizer_free (s_multi);
	481	gsl_min_fminimizer_free (s);
	482	gsl_vector_free (x);
	483	//gsl_vector_free (ss);
	484	}
	485
	486	/** Tests overlap matrix between each pair of orbitals for non-diagonal form.
	487	* We simply check whether the overlap matrix Psis#lambda has off-diagonal entries greater MYEPSILON or not.
	488	* \param *P Problem at hand
	489	* \note The routine is meant as atest criteria if \f$\Delta J_[ij]\f$ contribution is necessary, as it is only non-zero if
	490	* there is mutual overlap between the two orbitals.
	491	*/
	492	int CheckOrbitalOverlap(struct Problem *P)
	493	{
	494	struct Lattice *Lat = &P->Lat;
	495	struct Psis *Psi = &Lat->Psi;
	496	int i,j;
	497	int counter = 0;
	498
	499	// output matrix
	500	if (P->Par.me == 0) fprintf(stderr, "(%i) S_ij =\n", P->Par.me);
	501	for (i=0;i<Psi->NoOfPsis;i++) {
	502	for (j=0;j<Psi->NoOfPsis;j++) {
	503	if (fabs(Psi->lambda[i][j]) > MYEPSILON) counter++;
	504	if (P->Par.me == 0) fprintf(stderr, "%e\t", Psi->lambda[i][j]); //Overlap[i][j]
	505	}
	506	if (P->Par.me == 0) fprintf(stderr, "\n");
	507	}
	508
	509	fprintf(stderr, "(%i) CheckOverlap: %i overlaps found.\t", P->Par.me, counter);
	510	if (counter > 0) return (1);
	511	else return(0);
	512	}
	513
	514	/** Initialization of perturbed energy.
	515	* For each local wave function of the current minimisation type RunStruct#CurrentMin it is called:
	516	* - CalculateNonLocalEnergyNoRT(): for the coefficient-dependent form factors
	517	* - CalculatePerturbedEnergy(): for the perturbed energy, yet without gradient calculation
	518	* - CalculateOverlap(): for the overlap between the perturbed wave functions of the current RunStruct#CurrentMin state.
	519	*
	520	* Afterwards for the two types AllPsiEnergyTypes#Perturbed1_0Energy and AllPsiEnergyTypes#Perturbed0_1Energy the
	521	* energy contribution from each wave function is added up in Energy#AllLocalPsiEnergy.
	522	* \param *P Problem at hand
	523	* \param first state whether it is the first (1) or successive call (0), which avoids some initial calculations.
	524	* \sa UpdatePerturbedEnergy()
	525	* \note Afterwards EnergyAllReduce() must be called.
	526	*/
	527	void InitPerturbedEnergyCalculation(struct Problem *P, const int first)
	528	{
	529	struct Lattice *Lat = &(P->Lat);
	530	int p,i;
	531	const enum PsiTypeTag state = P->R.CurrentMin;
	532	for (p=Lat->Psi.TypeStartIndex[state]; p < Lat->Psi.TypeStartIndex[state+1]; p++) {
	533	//if (p < 0 \|\| p >= Lat->Psi.LocalNo) Error(SomeError,"InitPerturbedEnergyCalculation: p out of range");
	534	CalculateNonLocalEnergyNoRT(P, p); // recalculating non-local form factors which are coefficient dependent!
	535	CalculatePsiEnergy(P,p,1);
	536	CalculatePerturbedEnergy(P, p, 0, first);
	537	CalculateOverlap(P, p, state);
	538	}
	539	for (i=0; i<= Perturbed0_1Energy; i++) {
	540	Lat->E->AllLocalPsiEnergy[i] = 0.0;
	541	for (p=0; p < Lat->Psi.LocalNo; p++)
	542	if (P->Lat.Psi.LocalPsiStatus[p].PsiType == state)
	543	Lat->E->AllLocalPsiEnergy[i] += Lat->E->PsiEnergy[i][p];
	544	}
	545	}
	546
	547
	548	/** Updating of perturbed energy.
	549	* For current and former (if not the same) local wave function RunStruct#ActualLocal, RunStruct#OldActualLocalPsiNo it is called:
	550	* - CalculateNonLocalEnergyNoRT(): for the form factors
	551	* - CalculatePerturbedEnergy(): for the perturbed energy, gradient only for RunStruct#ActualLocal
	552	* - CalculatePerturbedOverlap(): for the overlap between the perturbed wave functions
	553	*
	554	* Afterwards for the two types AllPsiEnergyTypes#Perturbed1_0Energy and AllPsiEnergyTypes#Perturbed0_1Energy the
	555	* energy contribution from each wave function is added up in Energy#AllLocalPsiEnergy.
	556	* \param *P Problem at hand
	557	* \sa CalculatePerturbedEnergy() called from here.
	558	* \note Afterwards EnergyAllReduce() must be called.
	559	*/
	560	void UpdatePerturbedEnergyCalculation(struct Problem *P)
	561	{
	562	struct Lattice *Lat = &(P->Lat);
	563	struct Psis *Psi = &Lat->Psi;
	564	struct RunStruct *R = &P->R;
	565	const enum PsiTypeTag state = R->CurrentMin;
	566	int p = R->ActualLocalPsiNo;
	567	const int p_old = R->OldActualLocalPsiNo;
	568	int i;
	569
	570	if (p != p_old) {
	571	//if (p_old < 0 \|\| p_old >= Lat->Psi.LocalNo) Error(SomeError,"UpdatePerturbedEnergyCalculation: p_old out of range");
	572	CalculateNonLocalEnergyNoRT(P, p_old);
	573	CalculatePsiEnergy(P,p_old,0);
	574	CalculatePerturbedEnergy(P, p_old, 0, 0);
	575	CalculateOverlap(P, p_old, state);
	576	}
	577	//if (p < 0 \|\| p >= Lat->Psi.LocalNo) Error(SomeError,"InitPerturbedEnergyCalculation: p out of range");
	578	// recalculating non-local form factors which are coefficient dependent!
	579	CalculateNonLocalEnergyNoRT(P,p);
	580	CalculatePsiEnergy(P,p,0);
	581	CalculatePerturbedEnergy(P, p, 1, 0);
	582	CalculateOverlap(P, p, state);
	583
	584	for (i=0; i<= Perturbed0_1Energy; i++) {
	585	Lat->E->AllLocalPsiEnergy[i] = 0.0;
	586	for (p=0; p < Psi->LocalNo; p++)
	587	if (Psi->LocalPsiStatus[p].PsiType == state)
	588	Lat->E->AllLocalPsiEnergy[i] += Lat->E->PsiEnergy[i][p];
	589	}
	590	}
	591
	592	/** Calculates gradient and evaluates second order perturbed energy functional for specific wave function.
	593	* The in second order perturbed energy functional reads as follows.
	594	* \f[
	595	* E^{(2)} = \sum_{kl} \langle \varphi_k^{(1)} \| H^{(0)} \delta_{kl} - \lambda_{kl} \| \varphi_l^{(1)} \rangle
	596	* + \underbrace{\langle \varphi_l^{(0)} \| H^{(1)} \| \varphi_l^{(1)} \rangle + \langle \varphi_l^{(1)} \| H^{(1)} \| \varphi_l^{(0)} \rangle}_{2 {\cal R} \langle \varphi_l^{(1)} \| H^{(1)} \| \varphi_l^{(0)} \rangle}
	597	* \f]
	598	* And the gradient
	599	* \f[
	600	* \widetilde{\varphi}_k^{(1)} = - \sum_l ({\cal H}^{(0)} \delta_{kl} - \lambda_{kl} \| \varphi_l^{(1)} \rangle + {\cal H}^{(1)} \| \varphi_k^{(0)} \rangle
	601	* \f]
	602	* First, the HGDensity is recalculated if \a first says so - see ApplyTotalHamiltonian().
	603	*
	604	* Next, we need the perturbation hamiltonian acting on both the respective occupied and current wave function,
	605	* see perturbed.c for respective function calls.
	606	*
	607	* Finally, the scalar product between the wave function and Hc_Gradient yields the eigenvalue of the hamiltonian,
	608	* which is summed up over all reciprocal grid vectors and stored in OnePsiElementAddData#Lambda. The Gradient is
	609	* the inverse of Hc_Gradient and with the following summation over all perturbed wave functions (MPI exchange of
	610	* non-local coefficients) the gradient is computed. Here we need Psis#lambda, which is computed in CalculateHamiltonian().
	611	*
	612	* Also \f${\cal H}^{(1)} \| \varphi_l^{(0)} \rangle\f$ is stored in GradientTypes#H1cGradient.
	613	* \param *P Problem at hand, contains RunStruct, Lattice, LatticeLevel RunStruct#LevS
	614	* \param l offset of perturbed wave function within Psi#LocalPsiStatus (\f$\varphi_l^{(1)}\f$)
	615	* \param DoGradient (1 = yes, 0 = no) whether gradient shall be calculated or not
	616	* \param first recaculate HGDensity (1) or not (0)
	617	* \note DensityTypes#ActualPsiDensity must be recent for gradient calculation!
	618	* \sa CalculateGradientNoRT() - same procedure for evaluation of \f${\cal H}^{(0)}\| \varphi_l^{(1)} \rangle\f$
	619	* \note without the simplification of \f$2 {\cal R} \langle \varphi_l^{(1)} \| H^{(1)} \| \varphi_l^{(0)} \rangle\f$ the
	620	* calculation would be impossible due to non-local nature of perturbed wave functions. The position operator would
	621	* be impossible to apply in a sensible manner.
	622	*/
	623	void CalculatePerturbedEnergy(struct Problem *P, const int l, const int DoGradient, const int first)
	624	{
	625	struct Lattice *Lat = &P->Lat;
	626	struct Psis *Psi = &Lat->Psi;
	627	struct Energy *E = Lat->E;
	628	struct PseudoPot *PP = &P->PP;
	629	struct RunStruct *R = &P->R;
	630	struct LatticeLevel *LevS = R->LevS;
	631	const int state = R->CurrentMin;
	632	const int l_normal = Psi->TypeStartIndex[Occupied] + (l - Psi->TypeStartIndex[state]); // offset l to \varphi_l^{(0)}
	633	const int ActNum = l - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[1] * Psi->LocalPsiStatus[l].my_color_comm_ST_Psi;
	634	int g, i, m, j;
	635	double lambda, Lambda;
	636	double RElambda10, RELambda10;
	637	const fftw_complex *source = LevS->LPsi->LocalPsi[l];
	638	fftw_complex *grad = P->Grad.GradientArray[ActualGradient];
	639	fftw_complex *Hc_grad = P->Grad.GradientArray[HcGradient];
	640	fftw_complex *H1c_grad = P->Grad.GradientArray[H1cGradient];
	641	fftw_complex *TempPsi_0 = H1c_grad;
	642	fftw_complex varphi_1, varphi_0;
	643	struct OnePsiElement OnePsiB, LOnePsiB;
	644	fftw_complex *LPsiDatB=NULL;
	645	const int ElementSize = (sizeof(fftw_complex) / sizeof(double));
	646	int RecvSource;
	647	MPI_Status status;
	648
	649	// ============ Calculate H^(0) psi^(1) =============================
	650	//if (Hc_grad != P->Grad.GradientArray[HcGradient]) Error(SomeError,"CalculatePerturbedEnergy: Hc_grad corrupted");
	651	SetArrayToDouble0((double )Hc_grad,2R->InitLevS->MaxG);
	652	ApplyTotalHamiltonian(P,source,Hc_grad, PP->fnl[l], 1, first);
	653
	654	// ============ ENERGY FUNCTIONAL Evaluation PART 1 ================
	655	//if (l_normal < 0 \|\| l_normal >= Psi->LocalNo) Error(SomeError,"CalculatePerturbedEnergy: l_normal out of range");
	656	varphi_0 = LevS->LPsi->LocalPsi[l_normal];
	657	//if (l < 0 \|\| l >= Psi->LocalNo) Error(SomeError,"CalculatePerturbedEnergy: l out of range");
	658	varphi_1 = LevS->LPsi->LocalPsi[l];
	659	//if (TempPsi_0 != P->Grad.GradientArray[H1cGradient]) Error(SomeError,"CalculatePerturbedEnergy: TempPsi_0 corrupted");
	660	SetArrayToDouble0((double )TempPsi_0,2R->InitLevS->MaxG);
	661	switch (state) {
	662	case Perturbed_P0:
	663	CalculatePerturbationOperator_P(P,varphi_0,TempPsi_0,0); // \nabla_0 \| \varphi_l^{(0)} \rangle
	664	break;
	665	case Perturbed_P1:
	666	CalculatePerturbationOperator_P(P,varphi_0,TempPsi_0,1); // \nabla_1 \| \varphi_l^{(0)} \rangle
	667	break;
	668	case Perturbed_P2:
	669	CalculatePerturbationOperator_P(P,varphi_0,TempPsi_0,2); // \nabla_1 \| \varphi_l^{(0)} \rangle
	670	break;
	671	case Perturbed_RxP0:
	672	CalculatePerturbationOperator_RxP(P,varphi_0,TempPsi_0,l_normal,0); // r \times \nabla \| \varphi_l^{(0)} \rangle
	673	break;
	674	case Perturbed_RxP1:
	675	CalculatePerturbationOperator_RxP(P,varphi_0,TempPsi_0,l_normal,1); // r \times \nabla \| \varphi_l^{(0)} \rangle
	676	break;
	677	case Perturbed_RxP2:
	678	CalculatePerturbationOperator_RxP(P,varphi_0,TempPsi_0,l_normal,2); // r \times \nabla \| \varphi_l^{(0)} \rangle
	679	break;
	680	default:
	681	fprintf(stderr,"(%i) CalculatePerturbedEnergy called whilst not within perturbation run: CurrentMin = %i !\n",P->Par.me, R->CurrentMin);
	682	break;
	683	}
	684
	685	// ============ GRADIENT and EIGENVALUE Evaluation Part 1==============
	686	lambda = 0.0;
	687	if ((DoGradient) && (grad != NULL)) {
	688	g = 0;
	689	if (LevS->GArray[0].GSq == 0.0) {
	690	lambda += Hc_grad[0].re*source[0].re;
	691	//if (grad != P->Grad.GradientArray[ActualGradient]) Error(SomeError,"CalculatePerturbedEnergy: grad corrupted");
	692	grad[0].re = -(Hc_grad[0].re + TempPsi_0[0].re);
	693	grad[0].im = -(Hc_grad[0].im + TempPsi_0[0].im);
	694	g++;
	695	}
	696	for (;g<LevS->MaxG;g++) {
	697	lambda += 2.(Hc_grad[g].resource[g].re + Hc_grad[g].im*source[g].im);
	698	//if (grad != P->Grad.GradientArray[ActualGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"CalculatePerturbedEnergy: grad corrupted");
	699	grad[g].re = -(Hc_grad[g].re + TempPsi_0[g].re);
	700	grad[g].im = -(Hc_grad[g].im + TempPsi_0[g].im);
	701	}
	702
	703	m = -1;
	704	for (j=0; j < Psi->MaxPsiOfType+P->Par.Max_me_comm_ST_PsiT; j++) { // go through all wave functions
	705	OnePsiB = &Psi->AllPsiStatus[j]; // grab OnePsiB
	706	if (OnePsiB->PsiType == state) { // drop all but the ones of current min state
	707	m++; // increase m if it is type-specific wave function
	708	if (OnePsiB->my_color_comm_ST_Psi == P->Par.my_color_comm_ST_Psi) // local?
	709	LOnePsiB = &Psi->LocalPsiStatus[OnePsiB->MyLocalNo];
	710	else
	711	LOnePsiB = NULL;
	712	if (LOnePsiB == NULL) { // if it's not local ... receive it from respective process into TempPsi
	713	RecvSource = OnePsiB->my_color_comm_ST_Psi;
	714	MPI_Recv( LevS->LPsi->TempPsi, LevS->MaxG*ElementSize, MPI_DOUBLE, RecvSource, PerturbedTag, P->Par.comm_ST_PsiT, &status );
	715	LPsiDatB=LevS->LPsi->TempPsi;
	716	} else { // .. otherwise send it to all other processes (Max_me... - 1)
	717	for (i=0;i<P->Par.Max_me_comm_ST_PsiT;i++)
	718	if (i != OnePsiB->my_color_comm_ST_Psi)
	719	MPI_Send( LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo], LevS->MaxG*ElementSize, MPI_DOUBLE, i, PerturbedTag, P->Par.comm_ST_PsiT);
	720	LPsiDatB=LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo];
	721	} // LPsiDatB is now set to the coefficients of OnePsi either stored or MPI_Received
	722
	723	g = 0;
	724	if (LevS->GArray[0].GSq == 0.0) { // perform the summation
	725	//if (grad != P->Grad.GradientArray[ActualGradient]) Error(SomeError,"CalculatePerturbedEnergy: grad corrupted");
	726	grad[0].re += Lat->Psi.lambda[ActNum][m]*LPsiDatB[0].re;
	727	grad[0].im += Lat->Psi.lambda[ActNum][m]*LPsiDatB[0].im;
	728	g++;
	729	}
	730	for (;g<LevS->MaxG;g++) {
	731	//if (grad != P->Grad.GradientArray[ActualGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"CalculatePerturbedEnergy: grad corrupted");
	732	grad[g].re += Lat->Psi.lambda[ActNum][m]*LPsiDatB[g].re;
	733	grad[g].im += Lat->Psi.lambda[ActNum][m]*LPsiDatB[g].im;
	734	}
	735	}
	736	}
	737	} else {
	738	lambda = GradSP(P,LevS,Hc_grad,source);
	739	}
	740	MPI_Allreduce ( &lambda, &Lambda, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
	741	//fprintf(stderr,"(%i) Lambda[%i] = %lg\n",P->Par.me, l, Lambda);
	742	//if (l < 0 \|\| l >= Psi->LocalNo) Error(SomeError,"CalculatePerturbedEnergy: l out of range");
	743	Lat->Psi.AddData[l].Lambda = Lambda;
	744
	745	// ============ ENERGY FUNCTIONAL Evaluation PART 2 ================
	746	// varphi_1 jas negative symmetry, returning TempPsi_0 from CalculatePerturbedOperator also, thus real part of scalar product
	747	// "-" due to purely imaginary wave function is on left hand side, thus becomes complex conjugated: i -> -i
	748	// (-i goes into pert. op., "-" remains when on right hand side)
	749	RElambda10 = GradSP(P,LevS,varphi_1,TempPsi_0) * sqrt(Psi->LocalPsiStatus[l].PsiFactor * Psi->LocalPsiStatus[l_normal].PsiFactor);
	750	//RElambda01 = -GradSP(P,LevS,varphi_0,TempPsi_1) * sqrt(Psi->LocalPsiStatus[l].PsiFactor * Psi->LocalPsiStatus[l_normal].PsiFactor);
	751
	752	MPI_Allreduce ( &RElambda10, &RELambda10, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
	753	//MPI_Allreduce ( &RElambda01, &RELambda01, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
	754
	755	//if (l < 0 \|\| l >= Psi->LocalNo) Error(SomeError,"CalculatePerturbedEnergy: l out of range");
	756	E->PsiEnergy[Perturbed1_0Energy][l] = RELambda10;
	757	E->PsiEnergy[Perturbed0_1Energy][l] = RELambda10;
	758	// if (P->Par.me == 0) {
	759	// fprintf(stderr,"RE.Lambda10[%i-%i] = %lg\t RE.Lambda01[%i-%i] = %lg\n", l, l_normal, RELambda10, l_normal, l, RELambda01);
	760	// }
	761	// GradImSP() is only applicable to a product of wave functions with uneven symmetry!
	762	// Otherwise, due to the nature of symmetry, a sum over only half of the coefficients will in most cases not result in zero!
	763	}
	764
	765	/** Applies \f$H^{(0)}\f$ to a given \a source.
	766	* The DensityTypes#HGDensity is computed, the exchange potential added and the
	767	* whole multiplied - coefficient by coefficient - with the current wave function, taken from its density coefficients,
	768	* on the upper LatticeLevel (RunStruct#Lev0), which (DensityTypes#ActualPsiDensity) is updated beforehand.
	769	* After an inverse fft (now G-dependent) the non-local potential is added and
	770	* within the reciprocal basis set, the kinetic energy can be evaluated easily.
	771	* \param *P Problem at hand
	772	* \param *source pointer to source coefficient array, \f$\| \varphi(G) \rangle\f$
	773	* \param *dest pointer to dest coefficient array,\f$H^{(0)} \| \varphi(G) \rangle\f$
	774	* \param **fnl pointer to non-local form factor array
	775	* \param PsiFactor occupation number of orbital
	776	* \param first 1 - Re-calculate DensityTypes#HGDensity, 0 - don't
	777	* \sa CalculateConDirHConDir() - same procedure
	778	*/
	779	void ApplyTotalHamiltonian(struct Problem P, const fftw_complex source, fftw_complex dest, fftw_complex **fnl, const double PsiFactor, const int first) {
	780	struct Lattice *Lat = &P->Lat;
	781	struct RunStruct *R = &P->R;
	782	struct LatticeLevel *LevS = R->LevS;
	783	struct LatticeLevel *Lev0 = R->Lev0;
	784	struct Density *Dens0 = Lev0->Dens;
	785	struct fft_plan_3d *plan = Lat->plan;
	786	struct PseudoPot *PP = &P->PP;
	787	struct Ions *I = &P->Ion;
	788	fftw_complex *work = Dens0->DensityCArray[TempDensity];
	789	fftw_real *HGcR = Dens0->DensityArray[HGcDensity];
	790	fftw_complex HGcRC = (fftw_complex)HGcR;
	791	fftw_complex *HGC = Dens0->DensityCArray[HGDensity];
	792	fftw_real HGCR = (fftw_real )HGC;
	793	fftw_complex *PsiC = Dens0->DensityCArray[ActualPsiDensity];
	794	fftw_real PsiCR = (fftw_real )PsiC;
	795	//const fftw_complex *dest_bak = dest;
	796	int nx,ny,nz,iS,i0;
	797	const int Nx = LevS->Plan0.plan->local_nx;
	798	const int Ny = LevS->Plan0.plan->N[1];
	799	const int Nz = LevS->Plan0.plan->N[2];
	800	const int NUpx = LevS->NUp[0];
	801	const int NUpy = LevS->NUp[1];
	802	const int NUpz = LevS->NUp[2];
	803	const double HGcRCFactor = 1./LevS->MaxN;
	804	int g, Index, i, it;
	805	fftw_complex vp,rp,rhog,TotalPsiDensity;
	806	double Fac;
	807
	808	if (first) {
	809	// recalculate HGDensity
	810	//if (HGC != Dens0->DensityCArray[HGDensity]) Error(SomeError,"ApplyTotalHamiltonian: HGC corrupted");
	811	SetArrayToDouble0((double )HGC,2Dens0->TotalSize);
	812	g=0;
	813	if (Lev0->GArray[0].GSq == 0.0) {
	814	Index = Lev0->GArray[0].Index;
	815	c_re(vp) = 0.0;
	816	c_im(vp) = 0.0;
	817	for (it = 0; it < I->Max_Types; it++) {
	818	c_re(vp) += (c_re(I->I[it].SFactor[0])*PP->phi_ps_loc[it][0]);
	819	c_im(vp) += (c_im(I->I[it].SFactor[0])*PP->phi_ps_loc[it][0]);
	820	}
	821	//if (HGC != Dens0->DensityCArray[HGDensity] \|\| Index<0 \|\| Index>=Dens0->LocalSizeC) Error(SomeError,"ApplyTotalHamiltonian: HGC corrupted");
	822	c_re(HGC[Index]) = c_re(vp);
	823	c_re(TotalPsiDensity) = c_re(Dens0->DensityCArray[TotalDensity][Index]);
	824	c_im(TotalPsiDensity) = c_im(Dens0->DensityCArray[TotalDensity][Index]);
	825
	826	g++;
	827	}
	828	for (; g < Lev0->MaxG; g++) {
	829	Index = Lev0->GArray[g].Index;
	830	Fac = 4.*PI/(Lev0->GArray[g].GSq);
	831	c_re(vp) = 0.0;
	832	c_im(vp) = 0.0;
	833	c_re(rp) = 0.0;
	834	c_im(rp) = 0.0;
	835	for (it = 0; it < I->Max_Types; it++) {
	836	c_re(vp) += (c_re(I->I[it].SFactor[g])*PP->phi_ps_loc[it][g]);
	837	c_im(vp) += (c_im(I->I[it].SFactor[g])*PP->phi_ps_loc[it][g]);
	838	c_re(rp) += (c_re(I->I[it].SFactor[g])*PP->FacGauss[it][g]);
	839	c_im(rp) += (c_im(I->I[it].SFactor[g])*PP->FacGauss[it][g]);
	840	} // rp = n^{Gauss)(G)
	841
	842	// n^{tot} = n^0 + \lambda n^1 + ...
	843	//if (isnan(c_re(Dens0->DensityCArray[TotalDensity][Index]))) { fprintf(stderr,"(%i) WARNING in CalculatePerturbedEnergy(): TotalDensity[%i] = NaN!\n", P->Par.me, Index); Error(SomeError, "NaN-Fehler!"); }
	844	c_re(TotalPsiDensity) = c_re(Dens0->DensityCArray[TotalDensity][Index]);
	845	c_im(TotalPsiDensity) = c_im(Dens0->DensityCArray[TotalDensity][Index]);
	846
	847	c_re(rhog) = c_re(TotalPsiDensity)*R->HGcFactor+c_re(rp);
	848	c_im(rhog) = c_im(TotalPsiDensity)*R->HGcFactor+c_im(rp);
	849	// rhog = n(G) + n^{Gauss}(G), rhoe = n(G)
	850	//if (HGC != Dens0->DensityCArray[HGDensity] \|\| Index<0 \|\| Index>=Dens0->LocalSizeC) Error(SomeError,"ApplyTotalHamiltonian: HGC corrupted");
	851	c_re(HGC[Index]) = c_re(vp)+Fac*c_re(rhog);
	852	c_im(HGC[Index]) = c_im(vp)+Fac*c_im(rhog);
	853	}
	854	//
	855	for (i=0; i<Lev0->MaxDoubleG; i++) {
	856	//if (HGC != Dens0->DensityCArray[HGDensity] \|\| Lev0->DoubleG[2i+1]<0 \|\| Lev0->DoubleG[2i+1]>Dens0->LocalSizeC \|\| Lev0->DoubleG[2i]<0 \|\| Lev0->DoubleG[2i]>Dens0->LocalSizeC) Error(SomeError,"CalculatePerturbedEnergy: grad corrupted");
	857	HGC[Lev0->DoubleG[2i+1]].re = HGC[Lev0->DoubleG[2i]].re;
	858	HGC[Lev0->DoubleG[2i+1]].im = -HGC[Lev0->DoubleG[2i]].im;
	859	}
	860	}
	861	// ============ GRADIENT and EIGENVALUE Evaluation Part 1==============
	862	// \lambda_l^{(1)} = \langle \varphi_l^{(1)} \| H^{(0)} \| \varphi_l^{(1)} \rangle and gradient calculation
	863	SpeedMeasure(P, LocTime, StartTimeDo);
	864	// back-transform HGDensity: (G) -> (R)
	865	//if (HGC != Dens0->DensityCArray[HGDensity]) Error(SomeError,"ApplyTotalHamiltonian: HGC corrupted");
	866	if (first) fft_3d_complex_to_real(plan, Lev0->LevelNo, FFTNF1, HGC, work);
	867	// evaluate exchange potential with this density, add up onto HGCR
	868	//if (HGCR != (fftw_real *)Dens0->DensityCArray[HGDensity]) Error(SomeError,"ApplyTotalHamiltonian: HGCR corrupted");
	869	if (first) CalculateXCPotentialNoRT(P, HGCR); // add V^{xc} on V^H + V^{ps}
	870	// make sure that ActualPsiDensity is recent
	871	CalculateOneDensityR(Lat, LevS, Dens0, source, Dens0->DensityArray[ActualDensity], R->FactorDensityR*PsiFactor, 1);
	872	for (nx=0;nx<Nx;nx++)
	873	for (ny=0;ny<Ny;ny++)
	874	for (nz=0;nz<Nz;nz++) {
	875	i0 = nzNUpz+NzNUpz(nyNUpy+NyNUpynx*NUpx);
	876	iS = nz+Nz(ny+Nynx);
	877	//if (HGcR != Dens0->DensityArray[HGcDensity] \|\| iS<0 \|\| iS>=LevS->Dens->LocalSizeR) Error(SomeError,"ApplyTotalHamiltonian: HGC corrupted");
	878	HGcR[iS] = HGCR[i0]PsiCR[i0]; / Matrix Vector Mult */
	879	}
	880	// (R) -> (G)
	881	//if (HGcRC != (fftw_complex *)Dens0->DensityArray[HGcDensity]) Error(SomeError,"ApplyTotalHamiltonian: HGcRC corrupted");
	882	fft_3d_real_to_complex(plan, LevS->LevelNo, FFTNF1, HGcRC, work);
	883	SpeedMeasure(P, LocTime, StopTimeDo);
	884	/* NonLocalPP */
	885	SpeedMeasure(P, NonLocTime, StartTimeDo);
	886	//if (dest != dest_bak) Error(SomeError,"ApplyTotalHamiltonian: dest corrupted");
	887	CalculateAddNLPot(P, dest, fnl, PsiFactor); // wave function hidden in form factors fnl, also resets Hc_grad beforehand
	888	SpeedMeasure(P, NonLocTime, StopTimeDo);
	889
	890	/* create final vector */
	891	for (g=0;g<LevS->MaxG;g++) {
	892	Index = LevS->GArray[g].Index; /* FIXME - factoren */
	893	//if (dest != dest_bak \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"ApplyTotalHamiltonian: dest corrupted");
	894	dest[g].re += PsiFactor(HGcRC[Index].reHGcRCFactor + 0.5LevS->GArray[g].GSqsource[g].re);
	895	dest[g].im += PsiFactor(HGcRC[Index].imHGcRCFactor + 0.5LevS->GArray[g].GSqsource[g].im);
	896	}
	897	}
	898
	899	#define stay_above 0.001 //!< value above which the coefficient of the wave function will always remain
	900
	901	/** Finds the minimum of perturbed energy in regards of actual wave function.
	902	* The following happens step by step:
	903	* -# The Gradient is copied into GradientTypes#GraSchGradient (which is nothing but a pointer to
	904	* one array in LPsiDat) and orthonormalized via GramSch() to all occupied wave functions
	905	* except to the current perturbed one.
	906	* -# Then comes pre-conditioning, analogous to CalculatePreConGrad().
	907	* -# The Gradient is projected onto the current perturbed wave function and this is subtracted, i.e.
	908	* vector is the conjugate gradient.
	909	* -# Finally, Calculate1stPerturbedDerivative() and Calculate2ndPerturbedDerivative() are called and
	910	* with these results and the current total energy, CalculateDeltaI() finds the parameter for the one-
	911	* dimensional minimisation. The current wave function is set to newly found minimum and approximated
	912	* total energy is printed.
	913	*
	914	* \param *P Problem at hand
	915	* \sa CalculateNewWave() and functions therein
	916	*/
	917	void FindPerturbedMinimum(struct Problem *P)
	918	{
	919	struct Lattice *Lat = &P->Lat;
	920	struct RunStruct *R = &P->R;
	921	struct Psis *Psi = &Lat->Psi;
	922	struct PseudoPot *PP = &P->PP;
	923	struct LatticeLevel *LevS = R->LevS;
	924	struct LatticeLevel *Lev0 = R->Lev0;
	925	struct Density *Dens = Lev0->Dens;
	926	struct Energy *En = Lat->E;
	927	struct FileData *F = &P->Files;
	928	int g,p,i;
	929	int step = R->PsiStep;
	930	double *GammaDiv = &Lat->Psi.AddData[R->ActualLocalPsiNo].Gamma;
	931	const int ElementSize = (sizeof(fftw_complex) / sizeof(double));
	932	fftw_complex *source = LevS->LPsi->LocalPsi[R->ActualLocalPsiNo];
	933	fftw_complex *grad = P->Grad.GradientArray[ActualGradient];
	934	fftw_complex *GradOrtho = P->Grad.GradientArray[GraSchGradient];
	935	fftw_complex *PCgrad = P->Grad.GradientArray[PreConGradient];
	936	fftw_complex *PCOrtho = P->Grad.GradientArray[GraSchGradient];
	937	fftw_complex *ConDir = P->Grad.GradientArray[ConDirGradient];
	938	fftw_complex *ConDir_old = P->Grad.GradientArray[OldConDirGradient];
	939	fftw_complex *Ortho = P->Grad.GradientArray[GraSchGradient];
	940	const fftw_complex *Hc_grad = P->Grad.GradientArray[HcGradient];
	941	const fftw_complex *H1c_grad = P->Grad.GradientArray[H1cGradient];
	942	fftw_complex *HConDir = Dens->DensityCArray[ActualDensity];
	943	const double PsiFactor = Lat->Psi.LocalPsiStatus[R->ActualLocalPsiNo].PsiFactor;
	944	//double Lambda = Lat->Psi.AddData[R->ActualLocalPsiNo].Lambda;
	945	double T;
	946	double x, K; //, dK;
	947	double dS[2], S[2], Gamma, GammaDivOld = *GammaDiv;
	948	double LocalSP, PsiSP;
	949	double dEdt0, ddEddt0, ConDirHConDir, ConDirConDir;//, sourceHsource;
	950	double E0, E, delta;
	951	//double E0, E, dE, ddE, delta, dcos, dsin;
	952	//double EI, dEI, ddEI, deltaI, dcosI, dsinI;
	953	//double HartreeddEddt0, XCddEddt0;
	954	double d[4],D[4], Diff;
	955	const int Num = Psi->NoOfPsis;
	956
	957	// ORTHOGONALIZED-GRADIENT
	958	for (g=0;g<LevS->MaxG;g++) {
	959	//if (GradOrtho != P->Grad.GradientArray[GraSchGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: GradOrtho corrupted");
	960	GradOrtho[g].re = grad[g].re; //+Lambda*source[g].re;
	961	GradOrtho[g].im = grad[g].im; //+Lambda*source[g].im;
	962	}
	963	// include the ExtraPsi (which is the GraSchGradient!)
	964	SetGramSchExtraPsi(P, Psi, NotOrthogonal);
	965	// exclude the minimised Psi
	966	SetGramSchActualPsi(P, Psi, NotUsedToOrtho);
	967	SpeedMeasure(P, GramSchTime, StartTimeDo);
	968	// makes conjugate gradient orthogonal to all other orbits
	969	//fprintf(stderr,"CalculateCGGradient: GramSch() for extra orbital\n");
	970	GramSch(P, LevS, Psi, Orthogonalize);
	971	SpeedMeasure(P, GramSchTime, StopTimeDo);
	972	//if (grad != P->Grad.GradientArray[ActualGradient]) Error(SomeError,"FindPerturbedMinimum: grad corrupted");
	973	memcpy(grad, GradOrtho, ElementSizeLevS->MaxGsizeof(double));
	974	//memcpy(PCOrtho, GradOrtho, ElementSizeLevS->MaxGsizeof(double));
	975
	976	// PRE-CONDITION-GRADIENT
	977	//if (fabs(T) < MYEPSILON) T = 1;
	978	T = 0.;
	979	for (i=0;i<Num;i++)
	980	T += Psi->lambda[i][i];
	981	for (g=0;g<LevS->MaxG;g++) {
	982	x = .5*LevS->GArray[g].GSq;
	983	// FIXME: Good way of accessing reciprocal Lev0 Density coefficients on LevS! (not so trivial)
	984	//x += sqrt(Dens->DensityCArray[HGDensity][g].reDens->DensityCArray[HGDensity][g].re+Dens->DensityCArray[HGDensity][g].imDens->DensityCArray[HGDensity][g].im);
	985	x -= T/(double)Num;
	986	K = x/(xx+stay_abovestay_above);
	987	//if (PCOrtho != P->Grad.GradientArray[GraSchGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: PCOrtho corrupted");
	988	c_re(PCOrtho[g]) = K*c_re(grad[g]);
	989	c_im(PCOrtho[g]) = K*c_im(grad[g]);
	990	}
	991	SetGramSchExtraPsi(P, Psi, NotOrthogonal);
	992	SpeedMeasure(P, GramSchTime, StartTimeDo);
	993	// preconditioned direction is orthogonalized
	994	//fprintf(stderr,"CalculatePreConGrad: GramSch() for extra orbital\n");
	995	GramSch(P, LevS, Psi, Orthogonalize);
	996	SpeedMeasure(P, GramSchTime, StopTimeDo);
	997	//if (PCgrad != P->Grad.GradientArray[PreConGradient]) Error(SomeError,"FindPerturbedMinimum: PCgrad corrupted");
	998	memcpy(PCgrad, PCOrtho, ElementSizeLevS->MaxGsizeof(double));
	999
	1000	//debug(P, "Before ConDir");
	1001	//fprintf(stderr,"\|(%i)\|^2 = %lg\t \|PCgrad\|^2 = %lg\t \|PCgrad,(%i)\| = %lg\n", R->ActualLocalPsiNo, GradSP(P,LevS,source,source),GradSP(P,LevS,PCgrad,PCgrad), R->ActualLocalPsiNo, GradSP(P,LevS,PCgrad,source));
	1002	// CONJUGATE-GRADIENT
	1003	LocalSP = GradSP(P, LevS, PCgrad, grad);
	1004	MPI_Allreduce ( &LocalSP, &PsiSP, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
	1005	*GammaDiv = dS[0] = PsiSP;
	1006	dS[1] = GammaDivOld;
	1007	S[0]=dS[0]; S[1]=dS[1];
	1008	/MPI_Allreduce ( dS, S, 2, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_PsiT);/
	1009	if (step) { // only in later steps is the scalar product used, but always condir stored in oldcondir and Ortho (working gradient)
	1010	if (fabs(S[1]) < MYEPSILON) fprintf(stderr,"CalculateConDir: S[1] = %lg\n",S[1]);
	1011	Gamma = S[0]/S[1];
	1012	if (fabs(S[1]) < MYEPSILON) {
	1013	if (fabs(S[0]) < MYEPSILON)
	1014	Gamma = 1.0;
	1015	else
	1016	Gamma = 0.0;
	1017	}
	1018	for (g=0; g < LevS->MaxG; g++) {
	1019	//if (ConDir != P->Grad.GradientArray[ConDirGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: ConDir corrupted");
	1020	c_re(ConDir[g]) = c_re(PCgrad[g]) + Gamma*c_re(ConDir_old[g]);
	1021	c_im(ConDir[g]) = c_im(PCgrad[g]) + Gamma*c_im(ConDir_old[g]);
	1022	//if (ConDir_old != P->Grad.GradientArray[OldConDirGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: ConDir_old corrupted");
	1023	c_re(ConDir_old[g]) = c_re(ConDir[g]);
	1024	c_im(ConDir_old[g]) = c_im(ConDir[g]);
	1025	//if (Ortho != P->Grad.GradientArray[GraSchGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: Ortho corrupted");
	1026	c_re(Ortho[g]) = c_re(ConDir[g]);
	1027	c_im(Ortho[g]) = c_im(ConDir[g]);
	1028	}
	1029	} else {
	1030	Gamma = 0.0;
	1031	for (g=0; g < LevS->MaxG; g++) {
	1032	//if (ConDir != P->Grad.GradientArray[ConDirGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: ConDir corrupted");
	1033	c_re(ConDir[g]) = c_re(PCgrad[g]);
	1034	c_im(ConDir[g]) = c_im(PCgrad[g]);
	1035	//if (ConDir_old != P->Grad.GradientArray[OldConDirGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: ConDir_old corrupted");
	1036	c_re(ConDir_old[g]) = c_re(ConDir[g]);
	1037	c_im(ConDir_old[g]) = c_im(ConDir[g]);
	1038	//if (Ortho != P->Grad.GradientArray[GraSchGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: Ortho corrupted");
	1039	c_re(Ortho[g]) = c_re(ConDir[g]);
	1040	c_im(Ortho[g]) = c_im(ConDir[g]);
	1041	}
	1042	}
	1043	// orthonormalize
	1044	SetGramSchExtraPsi(P, Psi, NotOrthogonal);
	1045	SpeedMeasure(P, GramSchTime, StartTimeDo);
	1046	//fprintf(stderr,"CalculateConDir: GramSch() for extra orbital\n");
	1047	GramSch(P, LevS, Psi, Orthogonalize);
	1048	SpeedMeasure(P, GramSchTime, StopTimeDo);
	1049	//if (ConDir != P->Grad.GradientArray[ConDirGradient]) Error(SomeError,"FindPerturbedMinimum: ConDir corrupted");
	1050	memcpy(ConDir, Ortho, ElementSizeLevS->MaxGsizeof(double));
	1051	//debug(P, "Before LineSearch");
	1052	//fprintf(stderr,"\|(%i)\|^2 = %lg\t \|ConDir\|^2 = %lg\t \|ConDir,(%i)\| = %lg\n", R->ActualLocalPsiNo, GradSP(P,LevS,source,source),GradSP(P,LevS,ConDir,ConDir), R->ActualLocalPsiNo, GradSP(P,LevS,ConDir,source));
	1053	SetGramSchActualPsi(P, Psi, IsOrthogonal);
	1054
	1055	//fprintf(stderr,"(%i) Testing conjugate gradient for Orthogonality ...\n", P->Par.me);
	1056	//TestForOrth(P,LevS,ConDir);
	1057
	1058	// ONE-DIMENSIONAL LINE-SEARCH
	1059
	1060	// ========= dE / dt \| 0 ============
	1061	p = Lat->Psi.TypeStartIndex[Occupied] + (R->ActualLocalPsiNo - Lat->Psi.TypeStartIndex[R->CurrentMin]);
	1062	//if (Hc_grad != P->Grad.GradientArray[HcGradient]) Error(SomeError,"FindPerturbedMinimum: Hc_grad corrupted");
	1063	//if (H1c_grad != P->Grad.GradientArray[H1cGradient]) Error(SomeError,"FindPerturbedMinimum: H1c_grad corrupted");
	1064	d[0] = Calculate1stPerturbedDerivative(P, LevS->LPsi->LocalPsi[p], source, ConDir, Hc_grad, H1c_grad);
	1065	//CalculateConDirHConDir(P, ConDir, PsiFactor, &d[1], &d[2], &d[3]);
	1066	//if (ConDir != P->Grad.GradientArray[ConDirGradient]) Error(SomeError,"FindPerturbedMinimum: ConDir corrupted");
	1067	CalculateCDfnl(P, ConDir, PP->CDfnl); // calculate needed non-local form factors
	1068	//if (HConDir != Dens->DensityCArray[ActualDensity]) Error(SomeError,"FindPerturbedMinimum: HConDir corrupted");
	1069	SetArrayToDouble0((double )HConDir,Dens->TotalSize2);
	1070	//if (ConDir != P->Grad.GradientArray[ConDirGradient]) Error(SomeError,"FindPerturbedMinimum: ConDir corrupted");
	1071	ApplyTotalHamiltonian(P,ConDir,HConDir, PP->CDfnl, PsiFactor, 0); // applies H^(0) with total perturbed density!
	1072	d[1] = GradSP(P,LevS,ConDir,HConDir);
	1073	d[2] = GradSP(P,LevS,ConDir,ConDir);
	1074	d[3] = 0.;
	1075
	1076	// gather results
	1077	MPI_Allreduce ( &d, &D, 4, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
	1078	// ========== ddE / ddt \| 0 =========
	1079	dEdt0 = D[0];
	1080	for (i=MAXOLD-1; i > 0; i--)
	1081	En->dEdt0[i] = En->dEdt0[i-1];
	1082	En->dEdt0[0] = dEdt0;
	1083	ConDirHConDir = D[1];
	1084	ConDirConDir = D[2];
	1085	ddEddt0 = 0.0;
	1086	//if (ConDir != P->Grad.GradientArray[ConDirGradient]) Error(SomeError,"FindPerturbedMinimum: ConDir corrupted");
	1087	//if (H1c_grad != P->Grad.GradientArray[H1cGradient]) Error(SomeError,"FindPerturbedMinimum: H1c_grad corrupted");
	1088	ddEddt0 = Calculate2ndPerturbedDerivative(P, LevS->LPsi->LocalPsi[p], source, ConDir, Lat->Psi.AddData[R->ActualLocalPsiNo].Lambda * Psi->LocalPsiStatus[R->ActualLocalPsiNo].PsiFactor, ConDirHConDir, ConDirConDir);
	1089
	1090	for (i=MAXOLD-1; i > 0; i--)
	1091	En->ddEddt0[i] = En->ddEddt0[i-1];
	1092	En->ddEddt0[0] = ddEddt0;
	1093	E0 = En->TotalEnergy[0];
	1094	// delta
	1095	//if (isnan(E0)) { fprintf(stderr,"(%i) WARNING in CalculateLineSearch(): E0_%i[%i] = NaN!\n", P->Par.me, i, 0); Error(SomeError, "NaN-Fehler!"); }
	1096	//if (isnan(dEdt0)) { fprintf(stderr,"(%i) WARNING in CalculateLineSearch(): dEdt0_%i[%i] = NaN!\n", P->Par.me, i, 0); Error(SomeError, "NaN-Fehler!"); }
	1097	//if (isnan(ddEddt0)) { fprintf(stderr,"(%i) WARNING in CalculateLineSearch(): ddEddt0_%i[%i] = NaN!\n", P->Par.me, i, 0); Error(SomeError, "NaN-Fehler!"); }
	1098
	1099	////deltaI = CalculateDeltaI(E0, dEdt0, ddEddt0,
	1100	//// &EI, &dEI, &ddEI, &dcosI, &dsinI);
	1101	////delta = deltaI; E = EI; dE = dEI; ddE = ddEI; dcos = dcosI; dsin = dsinI;
	1102	if (ddEddt0 > 0) {
	1103	delta = - dEdt0/ddEddt0;
	1104	E = E0 + delta * dEdt0 + deltadelta/2. ddEddt0;
	1105	} else {
	1106	delta = 0.;
	1107	E = E0;
	1108	fprintf(stderr,"(%i) Taylor approximation leads not to minimum!\n",P->Par.me);
	1109	}
	1110
	1111	// shift energy delta values
	1112	for (i=MAXOLD-1; i > 0; i--) {
	1113	En->delta[i] = En->delta[i-1];
	1114	En->ATE[i] = En->ATE[i-1];
	1115	}
	1116	// store new one
	1117	En->delta[0] = delta;
	1118	En->ATE[0] = E;
	1119	if (En->TotalEnergy[1] != 0.)
	1120	Diff = fabs(En->TotalEnergy[1] - E0)/(En->TotalEnergy[1] - E0)*fabs((E0 - En->ATE[1])/E0);
	1121	else
	1122	Diff = 0.;
	1123	R->Diffcount += pow(Diff,2);
	1124
	1125	// reinstate actual density (only needed for UpdateDensityCalculation) ...
	1126	//CalculateOneDensityR(Lat, LevS, Dens, source, Dens->DensityArray[ActualDensity], R->FactorDensityR*Psi->LocalPsiStatus[R->ActualLocalPsiNo].PsiFactor, 1);
	1127	// ... before changing actual local Psi
	1128	for (g = 0; g < LevS->MaxG; g++) { // Here all coefficients are updated for the new found wave function
	1129	//if (isnan(ConDir[g].re)) { fprintf(stderr,"WARNGING: CalculateLineSearch(): ConDir_%i(%i) = NaN!\n", R->ActualLocalPsiNo, g); Error(SomeError, "NaN-Fehler!"); }
	1130	//if (source != LevS->LPsi->LocalPsi[R->ActualLocalPsiNo] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: source corrupted");
	1131	////c_re(source[g]) = c_re(source[g])dcos + c_re(ConDir[g])dsin;
	1132	////c_im(source[g]) = c_im(source[g])dcos + c_im(ConDir[g])dsin;
	1133	c_re(source[g]) = c_re(source[g]) + c_re(ConDir[g])*delta;
	1134	c_im(source[g]) = c_im(source[g]) + c_im(ConDir[g])*delta;
	1135	}
	1136	if (P->Call.out[StepLeaderOut]) {
	1137	fprintf(stderr, "(%i,%i,%i)S(%i,%i,%i):\tTE: %e\tATE: %e\t Diff: %e\t --- d: %e\tdEdt0: %e\tddEddt0: %e\n",P->Par.my_color_comm_ST,P->Par.me_comm_ST, P->Par.me_comm_ST_PsiT, R->MinStep, R->ActualLocalPsiNo, R->PsiStep, E0, E, Diff,delta, dEdt0, ddEddt0);
	1138	//fprintf(stderr, "(%i,%i,%i)S(%i,%i,%i):\tp0: %e p1: %e p2: %e \tATE: %e\t Diff: %e\t --- d: %e\tdEdt0: %e\tddEddt0: %e\n",P->Par.my_color_comm_ST,P->Par.me_comm_ST, P->Par.me_comm_ST_PsiT, R->MinStep, R->ActualLocalPsiNo, R->PsiStep, En->parts[0], En->parts[1], En->parts[2], E, Diff,delta, dEdt0, ddEddt0);
	1139	}
	1140	if (P->Par.me == 0) {
	1141	fprintf(F->MinimisationFile, "%i\t%i\t%i\t%e\t%e\t%e\t%e\t%e\n",R->MinStep, R->ActualLocalPsiNo, R->PsiStep, E0, E, delta, dEdt0, ddEddt0);
	1142	fflush(F->MinimisationFile);
	1143	}
	1144	}
	1145
	1146	/** Applies perturbation operator \f$\nabla_{index}\f$ to \a *source.
	1147	* As wave functions are stored in the reciprocal basis set, the application is straight-forward,
	1148	* for every G vector, the by \a index specified component is multiplied with the respective
	1149	* coefficient. Afterwards, 1/i is applied by flipping real and imaginary components (and an additional minus sign on the new imaginary term).
	1150	* \param *P Problem at hand
	1151	* \param *source complex coefficients of wave function \f$\varphi(G)\f$
	1152	* \param *dest returned complex coefficients of wave function \f$\widehat{p}_{index}\|\varphi(G)\f$
	1153	* \param index_g vectorial index of operator to be applied
	1154	*/
	1155	void CalculatePerturbationOperator_P(struct Problem P, const fftw_complex source, fftw_complex *dest, const int index_g)
	1156	{
	1157	struct RunStruct *R = &P->R;
	1158	struct LatticeLevel *LevS = R->LevS;
	1159	//const fftw_complex *dest_bak = dest;
	1160	int g = 0;
	1161	if (LevS->GArray[0].GSq == 0.0) {
	1162	//if (dest != dest_bak) Error(SomeError,"CalculatePerturbationOperator_P: dest corrupted");
	1163	dest[0].re = LevS->GArray[0].G[index_g]*source[0].im;
	1164	dest[0].im = -LevS->GArray[0].G[index_g]*source[0].re;
	1165	g++;
	1166	}
	1167	for (;g<LevS->MaxG;g++) {
	1168	//if (dest != dest_bak \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"CalculatePerturbationOperator_P: g out of range");
	1169	dest[g].re = LevS->GArray[g].G[index_g]*source[g].im;
	1170	dest[g].im = -LevS->GArray[g].G[index_g]*source[g].re;
	1171	}
	1172	// don't put dest[0].im = 0! Otherwise real parts of perturbed01/10 are not the same anymore!
	1173	}
	1174
	1175	/** Applies perturbation operator \f$\widehat{r}_{index}\f$ to \a *source.
	1176	* The \a *source wave function is blown up onto upper level LatticeLevel RunStruct#Lev0, fourier
	1177	* transformed. Afterwards, for each point on the real mesh the coefficient is multiplied times the real
	1178	* vector pointing within the cell to the mesh point, yet on LatticeLevel RunStruct#LevS. The new wave
	1179	* function is inverse fourier transformed and the resulting reciprocal coefficients stored in *dest.
	1180	* \param *P Problem at hand
	1181	* \param *source source coefficients
	1182	* \param *source2 second source coefficients, e.g. in the evaluation of a scalar product
	1183	* \param *dest destination coefficienta array, is overwrittten!
	1184	* \param index_r index of real vector.
	1185	* \param wavenr index of respective PsiTypeTag#Occupied(!) OnePsiElementAddData for the needed Wanner centre of the wave function.
	1186	*/
	1187	void CalculatePerturbationOperator_R(struct Problem P, const fftw_complex source, fftw_complex dest, const fftw_complex source2, const int index_r, const int wavenr)
	1188	{
	1189	struct Lattice *Lat = &P->Lat;
	1190	struct RunStruct *R = &P->R;
	1191	struct LatticeLevel *Lev0 = R->Lev0;
	1192	struct LatticeLevel *LevS = R->LevS;
	1193	struct Density *Dens0 = Lev0->Dens;
	1194	struct fft_plan_3d *plan = Lat->plan;
	1195	fftw_complex *TempPsi = Dens0->DensityCArray[Temp2Density];
	1196	fftw_real TempPsiR = (fftw_real ) TempPsi;
	1197	fftw_complex *workC = Dens0->DensityCArray[TempDensity];
	1198	fftw_complex *PsiC = Dens0->DensityCArray[ActualPsiDensity];
	1199	fftw_real PsiCR = (fftw_real ) PsiC;
	1200	fftw_complex tempdestRC = (fftw_complex )Dens0->DensityArray[TempDensity];
	1201	fftw_complex posfac, destsnd, *destrcv;
	1202	double x[NDIM], fac[NDIM], Wcentre[NDIM];
	1203	const int k_normal = Lat->Psi.TypeStartIndex[Occupied] + (wavenr - Lat->Psi.TypeStartIndex[R->CurrentMin]);
	1204	int n[NDIM], n0, g, Index, pos, iS, i0;
	1205	int N[NDIM], NUp[NDIM];
	1206	const int N0 = LevS->Plan0.plan->local_nx;
	1207	N[0] = LevS->Plan0.plan->N[0];
	1208	N[1] = LevS->Plan0.plan->N[1];
	1209	N[2] = LevS->Plan0.plan->N[2];
	1210	NUp[0] = LevS->NUp[0];
	1211	NUp[1] = LevS->NUp[1];
	1212	NUp[2] = LevS->NUp[2];
	1213	Wcentre[0] = Lat->Psi.AddData[k_normal].WannierCentre[0];
	1214	Wcentre[1] = Lat->Psi.AddData[k_normal].WannierCentre[1];
	1215	Wcentre[2] = Lat->Psi.AddData[k_normal].WannierCentre[2];
	1216	// init pointers and values
	1217	const int myPE = P->Par.me_comm_ST_Psi;
	1218	const double FFTFactor = 1./LevS->MaxN;
	1219	double vector;
	1220	//double result, Result;
	1221
	1222	// blow up source coefficients
	1223	LockDensityArray(Dens0,TempDensity,real); // tempdestRC
	1224	LockDensityArray(Dens0,Temp2Density,imag); // TempPsi
	1225	LockDensityArray(Dens0,ActualPsiDensity,imag); // PsiC
	1226	//if (tempdestRC != (fftw_complex *)Dens0->DensityArray[TempDensity]) Error(SomeError,"CalculatePerturbationOperator_R: tempdestRC corrupted");
	1227	SetArrayToDouble0((double )tempdestRC ,Dens0->TotalSize2);
	1228	//if (TempPsi != Dens0->DensityCArray[Temp2Density]) Error(SomeError,"CalculatePerturbationOperator_R: TempPsi corrupted");
	1229	SetArrayToDouble0((double )TempPsi ,Dens0->TotalSize2);
	1230	//if (PsiC != Dens0->DensityCArray[ActualPsiDensity]) Error(SomeError,"CalculatePerturbationOperator_R: PsiC corrupted");
	1231	SetArrayToDouble0((double )PsiC,Dens0->TotalSize2);
	1232	for (g=0; g<LevS->MaxG; g++) {
	1233	Index = LevS->GArray[g].Index;
	1234	posfac = &LevS->PosFactorUp[LevS->MaxNUp*g];
	1235	destrcv = &tempdestRC[LevS->MaxNUp*Index];
	1236	for (pos=0; pos < LevS->MaxNUp; pos++) {
	1237	//if (destrcv != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->LocalSizeC) Error(SomeError,"CalculatePerturbationOperator_R: destrcv corrupted");
	1238	destrcv [pos].re = (( source[g].re)posfac[pos].re-(source[g].im)posfac[pos].im);
	1239	destrcv [pos].im = (( source[g].re)posfac[pos].im+(source[g].im)posfac[pos].re);
	1240	}
	1241	}
	1242	for (g=0; g<LevS->MaxDoubleG; g++) {
	1243	destsnd = &tempdestRC [LevS->DoubleG[2g]LevS->MaxNUp];
	1244	destrcv = &tempdestRC [LevS->DoubleG[2g+1]LevS->MaxNUp];
	1245	for (pos=0; pos<LevS->MaxNUp; pos++) {
	1246	//if (destrcv != &tempdestRC [LevS->DoubleG[2g+1]LevS->MaxNUp] \|\| LevS->DoubleG[2g]LevS->MaxNUp+pos<0 \|\| LevS->DoubleG[2g]LevS->MaxNUp+pos>=Dens0->LocalSizeC\|\| LevS->DoubleG[2g+1]LevS->MaxNUp+pos<0 \|\| LevS->DoubleG[2g+1]LevS->MaxNUp+pos>=Dens0->LocalSizeC) Error(SomeError,"CalculatePerturbationOperator_R: destrcv corrupted");
	1247	destrcv [pos].re = destsnd [pos].re;
	1248	destrcv [pos].im = -destsnd [pos].im;
	1249	}
	1250	}
	1251	// fourier transform blown up wave function
	1252	//if (tempdestRC != (fftw_complex *)Dens0->DensityArray[TempDensity]) Error(SomeError,"CalculatePerturbationOperator_R: tempdestRC corrupted");
	1253	//if (workC != Dens0->DensityCArray[TempDensity]) Error(SomeError,"CalculatePerturbationOperator_R: workC corrupted");
	1254	fft_3d_complex_to_real(plan,LevS->LevelNo, FFTNFUp, tempdestRC , workC);
	1255	//if (tempdestRC != (fftw_complex *)Dens0->DensityArray[TempDensity]) Error(SomeError,"CalculatePerturbationOperator_R: tempdestRC corrupted");
	1256	//if (TempPsiR != (fftw_real *)Dens0->DensityCArray[Temp2Density]) Error(SomeError,"CalculatePerturbationOperator_R: TempPsiR corrupted");
	1257	DensityRTransformPos(LevS,(fftw_real*)tempdestRC ,TempPsiR );
	1258	UnLockDensityArray(Dens0,TempDensity,real); // TempdestRC
	1259
	1260	//result = 0.;
	1261	// for every point on the real grid multiply with component of position vector
	1262	for (n0=0; n0<N0; n0++)
	1263	for (n[1]=0; n[1]<N[1]; n[1]++)
	1264	for (n[2]=0; n[2]<N[2]; n[2]++) {
	1265	n[0] = n0 + N0 * myPE;
	1266	fac[0] = (double)(n[0])/(double)((N[0]));
	1267	fac[1] = (double)(n[1])/(double)((N[1]));
	1268	fac[2] = (double)(n[2])/(double)((N[2]));
	1269	RMat33Vec3(x,Lat->RealBasis,fac);
	1270	iS = n[2] + N[2](n[1] + N[1]n0); // mind splitting of x axis due to multiple processes
	1271	i0 = n[2]NUp[2]+N[2]NUp[2](n[1]NUp[1]+N[1]NUp[1]n0*NUp[0]);
	1272	//PsiCR[iS] = ((double)n[0]/(double)N[0]Lat->RealBasis[0] - fabs(Wcentre[0]))TempPsiR[i0] - ((double)n[1]/(double)N[1]Lat->RealBasis[4] - fabs(Wcentre[1]))TempPsi2R[i0];
	1273	//fprintf(stderr,"(%i) R[%i] = (%lg,%lg,%lg)\n",P->Par.me, i0, x[0], x[1], x[2]);
	1274	//else fprintf(stderr,"(%i) WCentre[%i] = %e \n",P->Par.me, index_r, Wcentre[index_r]);
	1275	vector = sawtooth(Lat,MinImageConv(Lat,x[index_r],Wcentre[index_r],index_r),index_r);
	1276	//vector = 1.;//sin((double)(n[index_r])/(double)((N[index_r]))2PI);
	1277	PsiCR[iS] = vector * TempPsiR[i0];
	1278	//fprintf(stderr,"(%i) vector(%i/%i,%i/%i,%i/%i): %lg\tx[%i] = %e\tWcentre[%i] = %e\tTempPsiR[%i] = %e\tPsiCR[%i] = %e\n",P->Par.me, n[0], N[0], n[1], N[1], n[2], N[2], vector, index_r, x[index_r],index_r, Wcentre[index_r],i0,TempPsiR[i0],iS,PsiCR[iS]);
	1279
	1280	//truedist(Lat,x[cross(index_r,2)],Wcentre[cross(index_r,2)],cross(index_r,2)) * TempPsiR[i0];
	1281	//tmp += truedist(Lat,x[index_r],WCentre[index_r],index_r) * RealPhiR[i0];
	1282	//tmp += sawtooth(Lat,truedist(Lat,x[index_r],WCentre[index_r],index_r), index_r)*RealPhiR[i0];
	1283	//(Fehler mit falschem Ort ist vor dieser Stelle!): ueber result = RealPhiR[i0] * (x[index_r]) * RealPhiR[i0]; gecheckt
	1284	//result += TempPsiR[i0] * PsiCR[iS];
	1285	}
	1286	UnLockDensityArray(Dens0,Temp2Density,imag); // TempPsi
	1287	//MPI_Allreduce( &result, &Result, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
	1288	//if (P->Par.me == 0) fprintf(stderr,"(%i) PerturbationOpertator_R: %e\n",P->Par.me, Result/LevS->MaxN);
	1289	// inverse fourier transform
	1290	fft_3d_real_to_complex(plan,LevS->LevelNo, FFTNF1, PsiC, workC);
	1291	//fft_3d_real_to_complex(plan,LevS->LevelNo, FFTNF1, Psi2C, workC);
	1292
	1293	// copy to destination array
	1294	for (g=0; g<LevS->MaxG; g++) {
	1295	Index = LevS->GArray[g].Index;
	1296	dest[g].re = ( PsiC[Index].re)*FFTFactor;
	1297	dest[g].im = ( PsiC[Index].im)*FFTFactor;
	1298	}
	1299	UnLockDensityArray(Dens0,ActualPsiDensity,imag); //PsiC
	1300	//if (LevS->GArray[0].GSq == 0)
	1301	// dest[0].im = 0; // imaginary of G=0 is zero
	1302	}
	1303	/*
	1304	{
	1305	struct RunStruct *R = &P->R;
	1306	struct LatticeLevel *Lev0 = R->Lev0;
	1307	struct LatticeLevel *LevS = R->LevS;
	1308	struct Lattice *Lat = &P->Lat;
	1309	struct fft_plan_3d *plan = Lat->plan;
	1310	struct Density *Dens0 = Lev0->Dens;
	1311	fftw_complex *tempdestRC = Dens0->DensityCArray[TempDensity];
	1312	fftw_real tempdestR = (fftw_real ) tempdestRC;
	1313	fftw_complex *work = Dens0->DensityCArray[Temp2Density];
	1314	fftw_complex PsiC = (fftw_complex ) Dens0->DensityCArray[ActualPsiDensity];;
	1315	fftw_real PsiCR = (fftw_real ) PsiC;
	1316	fftw_real RealPhiR = (fftw_real ) Dens0->DensityArray[Temp2Density];
	1317	fftw_complex posfac, destsnd, *destrcv;
	1318	double x[NDIM], fac[NDIM], WCentre[NDIM];
	1319	int n[NDIM], N0, n0, g, Index, pos, iS, i0;
	1320
	1321	// init pointers and values
	1322	int myPE = P->Par.me_comm_ST_Psi;
	1323	double FFTFactor = 1./LevS->MaxN;
	1324	int N[NDIM], NUp[NDIM];
	1325	N[0] = LevS->Plan0.plan->N[0];
	1326	N[1] = LevS->Plan0.plan->N[1];
	1327	N[2] = LevS->Plan0.plan->N[2];
	1328	NUp[0] = LevS->NUp[0];
	1329	NUp[1] = LevS->NUp[1];
	1330	NUp[2] = LevS->NUp[2];
	1331	N0 = LevS->Plan0.plan->local_nx;
	1332	wavenr = Lat->Psi.TypeStartIndex[Occupied] + (wavenr - Lat->Psi.TypeStartIndex[R->CurrentMin]);
	1333	Wcentre[0] = Lat->Psi.AddData[wavenr].WannierCentre[0];
	1334	Wcentre[1] = Lat->Psi.AddData[wavenr].WannierCentre[1];
	1335	Wcentre[2] = Lat->Psi.AddData[wavenr].WannierCentre[2];
	1336
	1337	// blow up source coefficients
	1338	SetArrayToDouble0((double )tempdestRC,Dens0->TotalSize2);
	1339	SetArrayToDouble0((double )RealPhiR,Dens0->TotalSize2);
	1340	SetArrayToDouble0((double )PsiC,Dens0->TotalSize2);
	1341	for (g=0; g<LevS->MaxG; g++) {
	1342	Index = LevS->GArray[g].Index;
	1343	posfac = &LevS->PosFactorUp[LevS->MaxNUp*g];
	1344	destrcv = &tempdestRC[LevS->MaxNUp*Index];
	1345	for (pos=0; pos<LevS->MaxNUp; pos++) {
	1346	destrcv[pos].re = (( source[g].re)posfac[pos].re-( source[g].im)posfac[pos].im);
	1347	destrcv[pos].im = (( source[g].re)posfac[pos].im+( source[g].im)posfac[pos].re);
	1348	}
	1349	}
	1350	for (g=0; g<LevS->MaxDoubleG; g++) {
	1351	destsnd = &tempdestRC[LevS->DoubleG[2g]LevS->MaxNUp];
	1352	destrcv = &tempdestRC[LevS->DoubleG[2g+1]LevS->MaxNUp];
	1353	for (pos=0; pos<LevS->MaxNUp; pos++) {
	1354	destrcv[pos].re = destsnd[pos].re;
	1355	destrcv[pos].im = -destsnd[pos].im;
	1356	}
	1357	}
	1358
	1359	// fourier transform blown up wave function
	1360	fft_3d_complex_to_real(plan,LevS->LevelNo, FFTNFUp, tempdestRC, work);
	1361	DensityRTransformPos(LevS,tempdestR,RealPhiR);
	1362
	1363	//fft_Psi(P,source,RealPhiR,0,0);
	1364
	1365	// for every point on the real grid multiply with component of position vector
	1366	for (n0=0; n0<N0; n0++)
	1367	for (n[1]=0; n[1]<N[1]; n[1]++)
	1368	for (n[2]=0; n[2]<N[2]; n[2]++) {
	1369	n[0] = n0 + N0 * myPE;
	1370	fac[0] = (double)(n[0])/(double)((N[0]));
	1371	fac[1] = (double)(n[1])/(double)((N[1]));
	1372	fac[2] = (double)(n[2])/(double)((N[2]));
	1373	RMat33Vec3(x,Lat->RealBasis,fac);
	1374	iS = n[2] + N[2](n[1] + N[1]n0); // mind splitting of x axis due to multiple processes
	1375	i0 = n[2]NUp[2]+N[2]NUp[2](n[1]NUp[1]+N[1]NUp[1]n0*NUp[0]);
	1376	//PsiCR[iS] = (x[index_r]) * RealPhiR[i0]; //- WCentre[index_r]
	1377	PsiCR[iS] = truedist(Lat,x[index_r],WCentre[index_r],index_r) * RealPhiR[i0];
	1378	//PsiCR[iS] = truedist(Lat,x[index_r],0.,index_r) * RealPhiR[i0];
	1379	//PsiCR[iS] = sawtooth(Lat,truedist(Lat,x[index_r],WCentre[index_r],index_r), index_r)*RealPhiR[i0];
	1380	//(Fehler mit falschem Ort ist vor dieser Stelle!): ueber result = RealPhiR[i0] * (x[index_r]) * RealPhiR[i0]; gecheckt
	1381	}
	1382
	1383	// inverse fourier transform
	1384	fft_3d_real_to_complex(plan,LevS->LevelNo, FFTNF1, PsiC, work);
	1385
	1386	// copy to destination array
	1387	for (g=0; g<LevS->MaxG; g++) {
	1388	Index = LevS->GArray[g].Index;
	1389	dest[g].re = ( PsiC[Index].re)*FFTFactor;
	1390	dest[g].im = ( PsiC[Index].im)*FFTFactor;
	1391	if (LevS->GArray[g].GSq == 0)
	1392	dest[g].im = 0; // imaginary of G=0 is zero
	1393	}
	1394	}*/
	1395
	1396	/** Prints the positions of all unperturbed orbitals to screen.
	1397	* \param *P Problem at hand
	1398	* \param type PsiTypeTag specifying group of orbitals
	1399	* \sa CalculatePerturbationOperator_R()
	1400	*/
	1401	void OutputOrbitalPositions(struct Problem *P, const enum PsiTypeTag type)
	1402	{
	1403	struct Lattice *Lat = &P->Lat;
	1404	struct Psis *Psi = &Lat->Psi;
	1405	struct RunStruct *R = &P->R;
	1406	struct LatticeLevel *LevS = R->LevS;
	1407	fftw_complex *temp = LevS->LPsi->TempPsi;
	1408	fftw_complex *source;
	1409	int wavenr, index;
	1410	double result[NDIM], Result[NDIM];
	1411	//double imsult[NDIM], Imsult[NDIM];
	1412	double norm[NDIM], Norm[NDIM];
	1413	//double imnorm[NDIM], imNorm[NDIM];
	1414	double Wcentre[NDIM];
	1415
	1416	// for every unperturbed wave function
	1417	for (wavenr=Psi->TypeStartIndex[type]; wavenr<Psi->TypeStartIndex[type+1]; wavenr++) {
	1418	source = LevS->LPsi->LocalPsi[wavenr];
	1419	Wcentre[0] = Psi->AddData[wavenr].WannierCentre[0];
	1420	Wcentre[1] = Psi->AddData[wavenr].WannierCentre[1];
	1421	Wcentre[2] = Psi->AddData[wavenr].WannierCentre[2];
	1422	for (index=0; index<NDIM; index++) {
	1423	SetArrayToDouble0((double )temp,2R->InitLevS->MaxG);
	1424	// apply position operator
	1425	CalculatePerturbationOperator_R(P,source,temp,source,index, wavenr + Psi->TypeStartIndex[R->CurrentMin]);
	1426	// take scalar product
	1427	result[index] = GradSP(P,LevS,source,temp);
	1428	//imsult[index] = GradImSP(P,LevS,source,temp);
	1429	norm[index] = GradSP(P,LevS,source,source);
	1430	//imnorm[index] = GradImSP(P,LevS,source,source);
	1431	MPI_Allreduce( result, Result, NDIM, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
	1432	//MPI_Allreduce( imsult, Imsult, NDIM, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
	1433	MPI_Allreduce( norm, Norm, NDIM, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
	1434	//MPI_Allreduce( imnorm, imNorm, NDIM, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
	1435	}
	1436	// print output to stderr
	1437	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Position of Orbital %i: (%e,%e,%e)\n",P->Par.me, wavenr, Result[0]/Norm[0]+Wcentre[0], Result[1]/Norm[1]+Wcentre[1], Result[2]/Norm[2]+Wcentre[2]);
	1438	//fprintf(stderr,"(%i) Position of Orbital %i wrt Wannier: (%e,%e,%e)\n",P->Par.me, wavenr, Result[0]/Norm[0], Result[1]/Norm[1], Result[2]/Norm[2]);
	1439	//fprintf(stderr,"(%i) with Norm: (%e,%e,%e) + i (%e,%e,%e)\n",P->Par.me, Norm[0], Norm[1], Norm[2], imNorm[0], imNorm[1], imNorm[2]);
	1440	//if (P->Par.me == 0) fprintf(stderr,"(%i) Position of Orbital %i: (%e,%e,%e)\n",P->Par.me, wavenr, Result[0]/Norm[0], Result[1]/Norm[1], Result[2]/Norm[2]);
	1441	}
	1442	}
	1443
	1444	#define borderstart 0.9
	1445
	1446	/** Applies perturbation operator \f$(\widehat{r} \times \nabla)_{index}\f$ to \a *source.
	1447	* The source is fourier-transformed by transforming it to a density (on the next higher level RunStruct#Lev0)
	1448	* and at the same time multiply it with the respective component of the reciprocal G vector - the momentum. This
	1449	* is done by callinf fft_Psi(). Thus we get \f$\nabla_k \| \varphi (R) \rangle\f$.
	1450	*
	1451	* Next, we apply the two of three components of the position operator r, which ones stated by cross(), while going
	1452	* in a loop through every point of the grid. In order to do this sensibly, truedist() is used to map the coordinates
	1453	* onto -L/2...L/2, by subtracting the OneElementPsiAddData#WannierCentre R and wrapping. Also, due to the breaking up
	1454	* of the x axis into equally sized chunks for each coefficient sharing process, we need to step only over local
	1455	* x-axis grid points, however shift them to the global position when being used as position. In the end, we get
	1456	* \f$\epsilon_{index,j,k} (\widehat{r}-R)_j \nabla_k \| \varphi (R) \rangle\f$.
	1457	*
	1458	* One last fft brings the wave function back to reciprocal basis and it is copied to \a *dest.
	1459	* \param *P Problem at hand
	1460	* \param *source complex coefficients of wave function \f$\varphi(G)\f$
	1461	* \param *dest returned complex coefficients of wave function \f$(\widehat{r} \times \widehat{p})_{index}\|\varphi(G)\rangle\f$
	1462	* \param phi0nr number within LocalPsi of the unperturbed pendant of the given perturbed wavefunction \a *source.
	1463	* \param index_rxp index desired of the vector product
	1464	* \sa CalculateConDirHConDir() - the procedure of fft and inverse fft is very similar.
	1465	*/
	1466	void CalculatePerturbationOperator_RxP(struct Problem P, const fftw_complex source, fftw_complex *dest, const int phi0nr, const int index_rxp)
	1467
	1468	{
	1469	struct Lattice *Lat = &P->Lat;
	1470	struct RunStruct *R = &P->R;
	1471	struct LatticeLevel *Lev0 = R->Lev0;
	1472	struct LatticeLevel *LevS = R->LevS;
	1473	struct Density *Dens0 = Lev0->Dens;
	1474	struct fft_plan_3d *plan = Lat->plan;
	1475	fftw_complex *TempPsi = Dens0->DensityCArray[Temp2Density];
	1476	fftw_real TempPsiR = (fftw_real ) TempPsi;
	1477	fftw_complex TempPsi2 = (fftw_complex )Dens0->DensityArray[Temp2Density];
	1478	fftw_real TempPsi2R = (fftw_real ) TempPsi2;
	1479	fftw_complex *workC = Dens0->DensityCArray[TempDensity];
	1480	fftw_complex *PsiC = Dens0->DensityCArray[ActualPsiDensity];
	1481	fftw_real PsiCR = (fftw_real ) PsiC;
	1482	double x[NDIM], fac[NDIM], Wcentre[NDIM];
	1483	int n[NDIM], n0, g, Index, iS, i0; //pos,
	1484	int N[NDIM], NUp[NDIM];
	1485	const int N0 = LevS->Plan0.plan->local_nx;
	1486	N[0] = LevS->Plan0.plan->N[0];
	1487	N[1] = LevS->Plan0.plan->N[1];
	1488	N[2] = LevS->Plan0.plan->N[2];
	1489	NUp[0] = LevS->NUp[0];
	1490	NUp[1] = LevS->NUp[1];
	1491	NUp[2] = LevS->NUp[2];
	1492	Wcentre[0] = Lat->Psi.AddData[phi0nr].WannierCentre[0];
	1493	Wcentre[1] = Lat->Psi.AddData[phi0nr].WannierCentre[1];
	1494	Wcentre[2] = Lat->Psi.AddData[phi0nr].WannierCentre[2];
	1495	// init pointers and values
	1496	const int myPE = P->Par.me_comm_ST_Psi;
	1497	const double FFTFactor = 1./LevS->MaxN; //
	1498	// double max[NDIM], max_psi[NDIM];
	1499	// double max_n[NDIM];
	1500	int index[4];
	1501	// double smooth, wall[NDIM];
	1502	// for (g=0;g<NDIM;g++) {
	1503	// max[g] = 0.;
	1504	// max_psi[g] = 0.;
	1505	// max_n[g] = -1.;
	1506	// }
	1507
	1508	//fprintf(stderr,"(%i) Wannier[%i] (%2.13e, %2.13e, %2.13e)\n", P->Par.me, phi0nr, 10.-Wcentre[0], 10.-Wcentre[1], 10.-Wcentre[2]);
	1509	for (g=0;g<4;g++)
	1510	index[g] = cross(index_rxp,g);
	1511
	1512	// blow up source coefficients
	1513	LockDensityArray(Dens0,Temp2Density,imag); // TempPsi
	1514	LockDensityArray(Dens0,Temp2Density,real); // TempPsi2
	1515	LockDensityArray(Dens0,ActualPsiDensity,imag); // PsiC
	1516
	1517	fft_Psi(P,source,TempPsiR ,index[1],7);
	1518	fft_Psi(P,source,TempPsi2R,index[3],7);
	1519
	1520	//result = 0.;
	1521	// for every point on the real grid multiply with component of position vector
	1522	for (n0=0; n0<N0; n0++)
	1523	for (n[1]=0; n[1]<N[1]; n[1]++)
	1524	for (n[2]=0; n[2]<N[2]; n[2]++) {
	1525	n[0] = n0 + N0 * myPE;
	1526	fac[0] = (double)(n[0])/(double)((N[0]));
	1527	fac[1] = (double)(n[1])/(double)((N[1]));
	1528	fac[2] = (double)(n[2])/(double)((N[2]));
	1529	RMat33Vec3(x,Lat->RealBasis,fac);
	1530	// fac[0] = (fac[0] > .9) ? fac[0]-0.9 : 0.;
	1531	// fac[1] = (fac[1] > .9) ? fac[1]-0.9 : 0.;
	1532	// fac[2] = (fac[2] > .9) ? fac[2]-0.9 : 0.;
	1533	// RMat33Vec3(wall,Lat->RealBasis,fac);
	1534	// smooth = exp(wall[0]wall[0]+wall[1]wall[1]+wall[2]*wall[2]); // smoothing near the borders of the virtual cell
	1535	iS = n[2] + N[2](n[1] + N[1]n0); // mind splitting of x axis due to multiple processes
	1536	i0 = n[2]NUp[2]+N[2]NUp[2](n[1]NUp[1]+N[1]NUp[1]n0*NUp[0]);
	1537
[f5586e]	1538	// if (fabs(truedist(Lat,x[index[1]],Wcentre[index[1]],index[1])) >= borderstart * sqrt(Lat->RealBasisSQ[index[1]])/2.)
[a0bcf1]	1539	// if (max[index[1]] < sawtooth(Lat,truedist(Lat,x[index[1]],Wcentre[index[1]],index[1]),index[1]) * TempPsiR [i0]) {
	1540	// max[index[1]] = sawtooth(Lat,truedist(Lat,x[index[1]],Wcentre[index[1]],index[1]),index[1]) * TempPsiR [i0];
	1541	// max_psi[index[1]] = TempPsiR [i0];
	1542	// max_n[index[1]] = truedist(Lat,x[index[1]],Wcentre[index[1]],index[1]);
	1543	// }
	1544	//
[f5586e]	1545	// if (fabs(truedist(Lat,x[index[3]],Wcentre[index[3]],index[3])) >= borderstart * sqrt(Lat->RealBasisSQ[index[3]])/2.)
[a0bcf1]	1546	// if (max[index[3]] < sawtooth(Lat,truedist(Lat,x[index[3]],Wcentre[index[3]],index[3]),index[3]) * TempPsiR [i0]) {
	1547	// max[index[3]] = sawtooth(Lat,truedist(Lat,x[index[3]],Wcentre[index[3]],index[3]),index[3]) * TempPsiR [i0];
	1548	// max_psi[index[3]] = TempPsiR [i0];
	1549	// max_n[index[3]] = truedist(Lat,x[index[3]],Wcentre[index[3]],index[3]);
	1550	// }
	1551
	1552	PsiCR[iS] = //vector * TempPsiR[i0];
	1553	sawtooth(Lat,MinImageConv(Lat,x[index[0]],Wcentre[index[0]],index[0]),index[0]) * TempPsiR [i0]
	1554	-sawtooth(Lat,MinImageConv(Lat,x[index[2]],Wcentre[index[2]],index[2]),index[2]) * TempPsi2R[i0];
	1555	// ShiftGaugeOrigin(P,truedist(Lat,x[index[0]],Wcentre[index[0]],index[0]),index[0]) * TempPsiR [i0]
	1556	// -ShiftGaugeOrigin(P,truedist(Lat,x[index[2]],Wcentre[index[2]],index[2]),index[2]) * TempPsi2R[i0];
	1557	// PsiCR[iS] = (x[index[0]] - Wcentre[index[0]]) * TempPsiR [i0] - (x[index[2]] - Wcentre[index[2]]) * TempPsi2R[i0];
	1558	}
	1559	//if (P->Par.me == 0) fprintf(stderr,"(%i) PerturbationOpertator_R(xP): %e\n",P->Par.me, Result/LevS->MaxN);
	1560	UnLockDensityArray(Dens0,Temp2Density,imag); // TempPsi
	1561	UnLockDensityArray(Dens0,Temp2Density,real); // TempPsi2
	1562
	1563	// // print maximum values
	1564	// fprintf (stderr,"(%i) RxP: Maximum values = (",P->Par.me);
	1565	// for (g=0;g<NDIM;g++)
	1566	// fprintf(stderr,"%lg\t", max[g]);
	1567	// fprintf(stderr,"\b)\t(");
	1568	// for (g=0;g<NDIM;g++)
	1569	// fprintf(stderr,"%lg\t", max_psi[g]);
	1570	// fprintf(stderr,"\b)\t");
	1571	// fprintf (stderr,"at (");
	1572	// for (g=0;g<NDIM;g++)
	1573	// fprintf(stderr,"%lg\t", max_n[g]);
	1574	// fprintf(stderr,"\b)\n");
	1575
	1576	// inverse fourier transform
	1577	//if (PsiC != Dens0->DensityCArray[ActualPsiDensity]) Error(SomeError,"CalculatePerturbationOperator_RxP: PsiC corrupted");
	1578	fft_3d_real_to_complex(plan,LevS->LevelNo, FFTNF1, PsiC, workC);
	1579
	1580	// copy to destination array
	1581	SetArrayToDouble0((double )dest, 2R->InitLevS->MaxG);
	1582	for (g=0; g<LevS->MaxG; g++) {
	1583	Index = LevS->GArray[g].Index;
	1584	dest[g].re += ( PsiC[Index].re)*FFTFactor; // factor confirmed, see grad.c:CalculateConDirHConDir()
	1585	dest[g].im += ( PsiC[Index].im)*FFTFactor;
	1586	//fprintf(stderr,"(%i) PsiC[(%lg,%lg,%lg)] = %lg +i %lg\n", P->Par.me, LevS->GArray[g].G[0], LevS->GArray[g].G[1], LevS->GArray[g].G[2], dest[g].re, dest[g].im);
	1587	}
	1588	UnLockDensityArray(Dens0,ActualPsiDensity,imag); // PsiC
	1589	//if (LevS->GArray[0].GSq == 0.)
	1590	//dest[0].im = 0.; // don't do this, see ..._P()
	1591	}
	1592
	1593	/** Applies perturbation operator \f$-(\nabla \times \widehat{r})_{index}\f$ to \a *source.
	1594	* Is analogous to CalculatePerturbationOperator_RxP(), only the order is reversed, first position operator, then
	1595	* momentum operator
	1596	* \param *P Problem at hand
	1597	* \param *source complex coefficients of wave function \f$\varphi(G)\f$
	1598	* \param *dest returned complex coefficients of wave function \f$(\widehat{r} \times \widehat{p})_{index}\|\varphi(G)\rangle\f$
	1599	* \param phi0nr number within LocalPsi of the unperturbed pendant of the given perturbed wavefunction \a *source.
	1600	* \param index_pxr index of position operator
	1601	* \note Only third component is important due to initial rotiation of cell such that B field is aligned with z axis.
	1602	* \sa CalculateConDirHConDir() - the procedure of fft and inverse fft is very similar.
	1603	* \bug routine is not tested (but should work), as it offers no advantage over CalculatePerturbationOperator_RxP()
	1604	*/
	1605	void CalculatePerturbationOperator_PxR(struct Problem P, const fftw_complex source, fftw_complex *dest, const int phi0nr, const int index_pxr)
	1606
	1607	{
	1608	struct Lattice *Lat = &P->Lat;
	1609	struct RunStruct *R = &P->R;
	1610	struct LatticeLevel *Lev0 = R->Lev0;
	1611	struct LatticeLevel *LevS = R->LevS;
	1612	struct Density *Dens0 = Lev0->Dens;
	1613	struct fft_plan_3d *plan = Lat->plan;
	1614	fftw_complex *TempPsi = Dens0->DensityCArray[Temp2Density];
	1615	fftw_real TempPsiR = (fftw_real ) TempPsi;
	1616	fftw_complex *workC = Dens0->DensityCArray[TempDensity];
	1617	fftw_complex *PsiC = Dens0->DensityCArray[ActualPsiDensity];
	1618	fftw_real PsiCR = (fftw_real ) PsiC;
	1619	fftw_complex *Psi2C = Dens0->DensityCArray[ActualDensity];
	1620	fftw_real Psi2CR = (fftw_real ) Psi2C;
	1621	fftw_complex tempdestRC = (fftw_complex )Dens0->DensityArray[Temp2Density];
	1622	fftw_complex posfac, destsnd, *destrcv;
	1623	double x[NDIM], fac[NDIM], Wcentre[NDIM];
	1624	int n[NDIM], n0, g, Index, pos, iS, i0;
	1625	int N[NDIM], NUp[NDIM];
	1626	const int N0 = LevS->Plan0.plan->local_nx;
	1627	N[0] = LevS->Plan0.plan->N[0];
	1628	N[1] = LevS->Plan0.plan->N[1];
	1629	N[2] = LevS->Plan0.plan->N[2];
	1630	NUp[0] = LevS->NUp[0];
	1631	NUp[1] = LevS->NUp[1];
	1632	NUp[2] = LevS->NUp[2];
	1633	Wcentre[0] = Lat->Psi.AddData[phi0nr].WannierCentre[0];
	1634	Wcentre[1] = Lat->Psi.AddData[phi0nr].WannierCentre[1];
	1635	Wcentre[2] = Lat->Psi.AddData[phi0nr].WannierCentre[2];
	1636	// init pointers and values
	1637	const int myPE = P->Par.me_comm_ST_Psi;
	1638	const double FFTFactor = 1./LevS->MaxN;
	1639
	1640	// blow up source coefficients
	1641	SetArrayToDouble0((double )tempdestRC ,Dens0->TotalSize2);
	1642	SetArrayToDouble0((double )TempPsi ,Dens0->TotalSize2);
	1643	SetArrayToDouble0((double )PsiC,Dens0->TotalSize2);
	1644	SetArrayToDouble0((double )Psi2C,Dens0->TotalSize2);
	1645	for (g=0; g<LevS->MaxG; g++) {
	1646	Index = LevS->GArray[g].Index;
	1647	posfac = &LevS->PosFactorUp[LevS->MaxNUp*g];
	1648	destrcv = &tempdestRC[LevS->MaxNUp*Index];
	1649	for (pos=0; pos < LevS->MaxNUp; pos++) {
	1650	destrcv [pos].re = (( source[g].re)posfac[pos].re-( source[g].im)posfac[pos].im);
	1651	destrcv [pos].im = (( source[g].re)posfac[pos].im+( source[g].im)posfac[pos].re);
	1652	}
	1653	}
	1654	for (g=0; g<LevS->MaxDoubleG; g++) {
	1655	destsnd = &tempdestRC [LevS->DoubleG[2g]LevS->MaxNUp];
	1656	destrcv = &tempdestRC [LevS->DoubleG[2g+1]LevS->MaxNUp];
	1657	for (pos=0; pos<LevS->MaxNUp; pos++) {
	1658	destrcv [pos].re = destsnd [pos].re;
	1659	destrcv [pos].im = -destsnd [pos].im;
	1660	}
	1661	}
	1662	// fourier transform blown up wave function
	1663	fft_3d_complex_to_real(plan,LevS->LevelNo, FFTNFUp, tempdestRC , workC);
	1664	DensityRTransformPos(LevS,(fftw_real*)tempdestRC ,TempPsiR );
	1665
	1666	//fft_Psi(P,source,TempPsiR ,cross(index_pxr,1),7);
	1667	//fft_Psi(P,source,TempPsi2R,cross(index_pxr,3),7);
	1668
	1669	//result = 0.;
	1670	// for every point on the real grid multiply with component of position vector
	1671	for (n0=0; n0<N0; n0++)
	1672	for (n[1]=0; n[1]<N[1]; n[1]++)
	1673	for (n[2]=0; n[2]<N[2]; n[2]++) {
	1674	n[0] = n0 + N0 * myPE;
	1675	fac[0] = (double)(n[0])/(double)((N[0]));
	1676	fac[1] = (double)(n[1])/(double)((N[1]));
	1677	fac[2] = (double)(n[2])/(double)((N[2]));
	1678	RMat33Vec3(x,Lat->RealBasis,fac);
	1679	iS = n[2] + N[2](n[1] + N[1]n0); // mind splitting of x axis due to multiple processes
	1680	i0 = n[2]NUp[2]+N[2]NUp[2](n[1]NUp[1]+N[1]NUp[1]n0*NUp[0]);
	1681	// PsiCR[iS] = sawtooth(Lat,truedist(Lat,x[cross(index_pxr,1)],Wcentre[cross(index_pxr,1)],cross(index_pxr,1)),cross(index_pxr,1)) * TempPsiR[i0];
	1682	// Psi2CR[iS] = sawtooth(Lat,truedist(Lat,x[cross(index_pxr,3)],Wcentre[cross(index_pxr,3)],cross(index_pxr,3)),cross(index_pxr,3)) * TempPsiR[i0];
	1683	PsiCR[iS] = ShiftGaugeOrigin(P,MinImageConv(Lat,x[cross(index_pxr,1)],Wcentre[cross(index_pxr,1)],cross(index_pxr,1)),cross(index_pxr,1)) * TempPsiR[i0];
	1684	Psi2CR[iS] = ShiftGaugeOrigin(P,MinImageConv(Lat,x[cross(index_pxr,3)],Wcentre[cross(index_pxr,3)],cross(index_pxr,3)),cross(index_pxr,3)) * TempPsiR[i0];
	1685	}
	1686
	1687	// inverse fourier transform
	1688	fft_3d_real_to_complex(plan,LevS->LevelNo, FFTNF1, PsiC, workC);
	1689	fft_3d_real_to_complex(plan,LevS->LevelNo, FFTNF1, Psi2C, workC);
	1690
	1691	// copy to destination array
	1692	for (g=0; g<LevS->MaxG; g++) {
	1693	Index = LevS->GArray[g].Index;
	1694	dest[g].re = -LevS->GArray[g].G[cross(index_pxr,0)]( PsiC[Index].im)FFTFactor;
	1695	dest[g].im = -LevS->GArray[g].G[cross(index_pxr,0)](-PsiC[Index].re)FFTFactor;
	1696	dest[g].re -= -LevS->GArray[g].G[cross(index_pxr,2)]( Psi2C[Index].im)FFTFactor;
	1697	dest[g].im -= -LevS->GArray[g].G[cross(index_pxr,2)](-Psi2C[Index].re)FFTFactor;
	1698	}
	1699	if (LevS->GArray[0].GSq == 0.)
	1700	dest[0].im = 0.; // don't do this, see ..._P()
	1701	}
	1702
	1703	/** Evaluates first derivative of perturbed energy functional with respect to minimisation parameter \f$\Theta\f$.
	1704	* \f[
	1705	* \frac{\delta {\cal E}^{(2)}} {\delta \Theta} =
	1706	* 2 {\cal R} \langle \widetilde{\varphi}_i^{(1)} \| {\cal H}^{(0)} \| \varphi_i^{(1)} \rangle
	1707	* - \sum_l \lambda_{il} \langle \widetilde{\varphi}_i^{(1)} \| \varphi_l^{(1)} \rangle
	1708	* - \sum_k \lambda_{ki} \langle \varphi_k^{(1)} \| \widetilde{\varphi}_i^{(1)} \rangle
	1709	* + 2 {\cal R} \langle \widetilde{\varphi}_i^{(1)} \| {\cal H}^{(1)} \| \varphi_i^{(0)} \rangle
	1710	* \f]
	1711	*
	1712	* The summation over all Psis has again to be done with an MPI exchange of non-local coefficients, as the conjugate
	1713	* directions are not the same in situations where PePGamma > 1 (Psis split up among processes = multiple minimisation)
	1714	* \param *P Problem at hand
	1715	* \param source0 unperturbed wave function \f$\varphi_l^{(0)}\f$
	1716	* \param source perturbed wave function \f$\varphi_l^{(1)} (G)\f$
	1717	* \param ConDir normalized conjugate direction \f$\widetilde{\varphi}_l^{(1)} (G)\f$
	1718	* \param Hc_grad complex coefficients of \f$H^{(0)} \| \varphi_l^{(1)} (G) \rangle\f$, see GradientArray#HcGradient
	1719	* \param H1c_grad complex coefficients of \f$H^{(1)} \| \varphi_l^{(0)} (G) \rangle\f$, see GradientArray#H1cGradient
	1720	* \sa CalculateLineSearch() - used there, \sa CalculateConDirHConDir() - same principles
	1721	* \warning The MPI_Allreduce for the scalar product in the end has not been done and must not have been done for given
	1722	* parameters yet!
	1723	*/
	1724	double Calculate1stPerturbedDerivative(struct Problem P, const fftw_complex source0, const fftw_complex source, const fftw_complex ConDir, const fftw_complex Hc_grad, const fftw_complex H1c_grad)
	1725	{
	1726	struct RunStruct *R = &P->R;
	1727	struct Psis *Psi = &P->Lat.Psi;
	1728	struct LatticeLevel *LevS = R->LevS;
	1729	double result = 0., E0 = 0., Elambda = 0., E1 = 0.;//, E2 = 0.;
	1730	int i,m,j;
	1731	const int state = R->CurrentMin;
	1732	//const int l_normal = R->ActualLocalPsiNo - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[Occupied];
	1733	const int ActNum = R->ActualLocalPsiNo - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[1] * Psi->LocalPsiStatus[R->ActualLocalPsiNo].my_color_comm_ST_Psi;
	1734	//int l = R->ActualLocalPsiNo;
	1735	//int l_normal = Psi->TypeStartIndex[Occupied] + (l - Psi->TypeStartIndex[state]); // offset l to \varphi_l^{(0)}
	1736	struct OnePsiElement OnePsiB, LOnePsiB;
	1737	//fftw_complex *HConGrad = LevS->LPsi->TempPsi;
	1738	fftw_complex *LPsiDatB=NULL;
	1739	const int ElementSize = (sizeof(fftw_complex) / sizeof(double));
	1740	int RecvSource;
	1741	MPI_Status status;
	1742
	1743	//CalculateCDfnl(P,ConDir,PP->CDfnl);
	1744	//ApplyTotalHamiltonian(P,ConDir,HConDir, PP->CDfnl, 1, 0);
	1745	//E0 = (GradSP(P, LevS, ConDir, Hc_grad) + GradSP(P, LevS, source, HConDir)) * Psi->LocalPsiStatus[R->ActualLocalPsiNo].PsiFactor;
	1746	E0 = 2.GradSP(P, LevS, ConDir, Hc_grad) Psi->LocalPsiStatus[R->ActualLocalPsiNo].PsiFactor;
	1747	result = E0;
	1748	//fprintf(stderr,"(%i) 1st: E0 = \t\t%lg\n", P->Par.me, E0);
	1749
	1750	m = -1;
	1751	for (j=0; j < Psi->MaxPsiOfType+P->Par.Max_me_comm_ST_PsiT; j++) { // go through all wave functions
	1752	OnePsiB = &Psi->AllPsiStatus[j]; // grab OnePsiB
	1753	if (OnePsiB->PsiType == state) { // drop all but the ones of current min state
	1754	m++; // increase m if it is type-specific wave function
	1755	if (OnePsiB->my_color_comm_ST_Psi == P->Par.my_color_comm_ST_Psi) // local?
	1756	LOnePsiB = &Psi->LocalPsiStatus[OnePsiB->MyLocalNo];
	1757	else
	1758	LOnePsiB = NULL;
	1759	if (LOnePsiB == NULL) { // if it's not local ... receive it from respective process into TempPsi
	1760	RecvSource = OnePsiB->my_color_comm_ST_Psi;
	1761	MPI_Recv( LevS->LPsi->TempPsi, LevS->MaxG*ElementSize, MPI_DOUBLE, RecvSource, PerturbedTag, P->Par.comm_ST_PsiT, &status );
	1762	LPsiDatB=LevS->LPsi->TempPsi;
	1763	} else { // .. otherwise send it to all other processes (Max_me... - 1)
	1764	for (i=0;i<P->Par.Max_me_comm_ST_PsiT;i++)
	1765	if (i != OnePsiB->my_color_comm_ST_Psi)
	1766	MPI_Send( LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo], LevS->MaxG*ElementSize, MPI_DOUBLE, i, PerturbedTag, P->Par.comm_ST_PsiT);
	1767	LPsiDatB=LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo];
	1768	} // LPsiDatB is now set to the coefficients of OnePsi either stored or MPI_Received
	1769
	1770	Elambda -= 2.Psi->lambda[ActNum][m]GradSP(P, LevS, ConDir, LPsiDatB) * OnePsiB->PsiFactor; // lambda is symmetric
	1771	}
	1772	}
	1773	result += Elambda;
	1774	//fprintf(stderr,"(%i) 1st: Elambda = \t%lg\n", P->Par.me, Elambda);
	1775
	1776	E1 = 2.GradSP(P,LevS,ConDir,H1c_grad) sqrt(Psi->AllPsiStatus[ActNum].PsiFactor*Psi->LocalPsiStatus[R->ActualLocalPsiNo].PsiFactor);
	1777	result += E1;
	1778	//fprintf(stderr,"(%i) 1st: E1 = \t\t%lg\n", P->Par.me, E1);
	1779
	1780	return result;
	1781	}
	1782
	1783
	1784	/** Evaluates second derivative of perturbed energy functional with respect to minimisation parameter \f$\Theta\f$.
	1785	* \f[
	1786	* \frac{\delta^2 {\cal E}^{(2)}} {\delta \Theta^2} =
	1787	* 2 \bigl( \langle \widetilde{\varphi}_l^{(1)} \| {\cal H}^{(0)} \| \widetilde{\varphi}_l^{(1)} \rangle
	1788	* - \langle \varphi_l^{(1)} \| {\cal H}^{(0)} \| \varphi_l^{(1)} \rangle \bigr )
	1789	* + 2 \sum_{i,i \neq l } \lambda_{il} \langle \varphi_i^{(1)} \| \varphi_l^{(1)} \rangle
	1790	* - 2 {\cal R} \langle \varphi_l^{(1)} \| {\cal H}^{(1)} \| \varphi_l^{(0)} \rangle
	1791	* \f]
	1792	*
	1793	* The energy eigenvalues of \a ConDir and \a source must be supplied, they can be calculated via CalculateConDirHConDir() and/or
	1794	* by the due to CalculatePerturbedEnergy() already present OnePsiElementAddData#Lambda eigenvalue. The summation over the
	1795	* unperturbed lambda within the scalar product of perturbed wave functions is evaluated with Psis#lambda and Psis#Overlap.
	1796	* Afterwards, the ConDir density is calculated and also the i-th perturbed density to first degree. With these in a sum over
	1797	* all real mesh points the exchange-correlation first and second derivatives and also the Hartree potential ones can be calculated
	1798	* and summed up.
	1799	* \param *P Problem at hand
	1800	* \param source0 unperturbed wave function \f$\varphi_l^{(0)}\f$
	1801	* \param source wave function \f$\varphi_l^{(1)}\f$
	1802	* \param ConDir conjugated direction \f$\widetilde{\varphi}_l^{(1)}\f$
	1803	* \param sourceHsource eigenvalue of wave function \f$\langle \varphi_l^{(1)} \| H^{(0)} \| \varphi_l^{(1)}\rangle\f$
	1804	* \param ConDirHConDir perturbed eigenvalue of conjugate direction \f$\langle \widetilde{\varphi}_l^{(1)} \| H^{(0)} \| \widetilde{\varphi}_l^{(1)}\rangle\f$
	1805	* \param ConDirConDir norm of conjugate direction \f$\langle \widetilde{\varphi}_l^{(1)} \| \widetilde{\varphi}_l^{(1)}\rangle\f$
	1806	* \warning No MPI_AllReduce() takes place, parameters have to be reduced already.
	1807	*/
	1808	double Calculate2ndPerturbedDerivative(struct Problem P, const fftw_complex source0,const fftw_complex source, const fftw_complex ConDir,const double sourceHsource, const double ConDirHConDir, const double ConDirConDir)
	1809	{
	1810	struct RunStruct *R = &P->R;
	1811	struct Psis *Psi = &P->Lat.Psi;
	1812	//struct Lattice *Lat = &P->Lat;
	1813	//struct Energy *E = Lat->E;
	1814	double result = 0.;
	1815	double Con0 = 0., Elambda = 0.;//, E0 = 0., E1 = 0.;
	1816	//int i;
	1817	const int state = R->CurrentMin;
	1818	//const int l_normal = R->ActualLocalPsiNo - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[Occupied];
	1819	const int ActNum = R->ActualLocalPsiNo - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[1] * Psi->LocalPsiStatus[R->ActualLocalPsiNo].my_color_comm_ST_Psi;
	1820
	1821	Con0 = 2.*ConDirHConDir;
	1822	result += Con0;
	1823	////E0 = -2.*sourceHsource;
	1824	////result += E0;
	1825	////E1 = -E->PsiEnergy[Perturbed1_0Energy][R->ActualLocalPsiNo] - E->PsiEnergy[Perturbed0_1Energy][R->ActualLocalPsiNo];
	1826	////result += E1;
	1827	//fprintf(stderr,"(%i) 2nd: E1 = \t%lg\n", P->Par.me, E1);
	1828
	1829	////for (i=0;i<Lat->Psi.NoOfPsis;i++) {
	1830	//// if (i != ActNum) Elambda += Psi->lambda[i][ActNum]Psi->Overlap[i][ActNum]+ Psi->lambda[ActNum][i]Psi->Overlap[ActNum][i]; // overlap contains PsiFactor
	1831	////}
	1832	////Elambda = Psi->lambda[ActNum][ActNum]*Psi->Overlap[ActNum][ActNum];
	1833	Elambda = 2.Psi->lambda[ActNum][ActNum]ConDirConDir;
	1834	result -= Elambda;
	1835
	1836	//fprintf(stderr,"(%i) 2ndPerturbedDerivative: Result = Con0 + E0 + E1 + Elambda + dEdt0_XC + ddEddt0_XC + dEdt0_H + ddEddt0_H = %lg + %lg + %lg + %lg + %lg + %lg + %lg + %lg = %lg\n", P->Par.me, Con0, E0, E1, Elambda, VolumeFactorRdEdt0_XC, VolumeFactorRddEddt0_XC, dEdt0_H, ddEddt0_H, result);
	1837
	1838	return (result);
	1839	}
	1840
	1841	/** Returns index of specific component in 3x3 cross product.
	1842	* \param i vector product component index, ranging from 0..NDIM
	1843	* \param j index specifies which one of the four vectors in xy - yx, ranging from 0..3 (0,1 positive sign, 2,3 negative sign)
	1844	* \return Component 0..2 of vector to be taken to evaluate a vector product
	1845	* \sa crossed() - is the same but vice versa, return value must be specified, \a i is returned.
	1846	*/
	1847	inline int cross(int i, int j)
	1848	{
	1849	const int matrix[NDIM*4] = {1,2,2,1,2,0,0,2,0,1,1,0};
	1850	if (i>=0 && i<NDIM && j>=0 && j<4)
	1851	return (matrix[i*4+j]);
	1852	else {
	1853	Error(SomeError,"cross: i or j out of range!");
	1854	return (0);
	1855	}
	1856	}
	1857
	1858	/** Returns index of resulting vector component in 3x3 cross product.
	1859	* In the column specified by the \a j index \a i is looked for and the found row index returned.
	1860	* \param i vector component index, ranging from 0..NDIM
	1861	* \param j index specifies which one of the four vectors in xy - yx, ranging from 0..3 (0,1 positive sign, 2,3 negative sign)
	1862	* \return Component 0..2 of resulting vector
	1863	* \sa cross() - is the same but vice versa, return value must be specified, \a i is returned.
	1864	*/
	1865	inline int crossed(int i, int j)
	1866	{
	1867	const int matrix[NDIM*4] = {1,2,2,1,2,0,0,2,0,1,1,0};
	1868	int k;
	1869	if (i>=0 && i<NDIM && j>=0 && j<4) {
	1870	for (k=0;k<NDIM;k++)
	1871	if (matrix[4*k+j] == i) return(k);
	1872	Error(SomeError,"crossed: given component not found!");
	1873	return(-1);
	1874	} else {
	1875	Error(SomeError,"crossed: i or j out of range!");
	1876	return (-1);
	1877	}
	1878	}
	1879
	1880	#define Nsin 16 //!< should be dependent on MaxG/MaxN per axis!
	1881
	1882	/** Returns sawtooth shaped profile for position operator within cell.
[f5586e]	1883	* This is a mapping from -L/2...L/2 (L = length of unit cell derived from Lattice#RealBasisSQ) to -L/2 to L/2 with a smooth transition:
[a0bcf1]	1884	* \f[
	1885	* f(x): x \rightarrow \left \{
	1886	* \begin{array}{l}
	1887	* -\frac{L}{2} \cdot \sin \left ( \frac{x}{0,05\cdot L} \cdot \frac{\pi}{2} \right ), 0<x<0,05\cdot L \\
	1888	* (x - 0,05\cdot L) \cdot \frac{10}{9} - \frac{L}{2}, 0,05\cdot L \leq x<0,95\cdot L \\
	1889	* \frac{L}{2} \cdot \cos \left ( \frac{x-0,95\cdot L}{0,05\cdot L} \cdot \frac{\pi}{2} \right), 0,95\cdot L<x<L
	1890	* \end{array} \right \}
	1891	* \f]
[f5586e]	1892	* \param *Lat pointer to Lattice structure for Lattice#RealBasisSQ
[a0bcf1]	1893	* \param L parameter x
[f5586e]	1894	* \param index component index for Lattice#RealBasisSQ
[a0bcf1]	1895	*/
	1896	inline double sawtooth(struct Lattice *Lat, double L, const int index)
	1897	{
[f5586e]	1898	double axis = sqrt(Lat->RealBasisSQ[index]);
[a0bcf1]	1899	double sawstart = Lat->SawtoothStart;
	1900	double sawend = 1. - sawstart;
	1901	double sawfactor = (sawstart+sawend)/(sawend-sawstart);
	1902	//return(L);
	1903
	1904	//fprintf(stderr, "sawstart: %e\tsawend: %e\tsawfactor: %e\tL: %e\n", sawstart, sawend, sawfactor, L);
	1905	// transform and return (sawtooth profile checked, 04.08.06)
	1906	L += axis/2.; // transform to 0 ... L
	1907	if (L < (sawstartaxis)) return (-axis/(2sawfactor)sin(L/(sawstartaxis)*PI/2.)); // first smooth transition from 0 ... -L/2
	1908	if (L > (sawendaxis)) return ( axis/(2sawfactor)cos((L-sawendaxis)/(sawstartaxis)PI/2.)); // second smooth transition from +L/2 ... 0
	1909	//fprintf(stderr,"L %e\t sawstart %e\t sawend %e\t sawfactor %e\t axis%e\n", L, sawstart, sawend, sawfactor, axis);
	1910	//return ((L - sawstartaxis) - axis/(2sawfactor)); // area in between scale to -L/2 ... +L/2
	1911	return (L - axis/2); // area in between return as it was
	1912	}
	1913
	1914	/** Shifts the origin of the gauge according to the CSDGT method.
	1915	* \f[
	1916	* d(r) = r - \sum_{I_s,I_a} (r-R_{I_s,I_a}) exp{(-\alpha_{I_s,I_a}(r-R_{I_s,I_a})^4)}
	1917	* \f]
	1918	* This trafo is necessary as the current otherweise (CSGT) sensitively depends on the current around
	1919	* the core region inadequately/only moderately well approximated by a plane-wave-pseudo-potential-method.
	1920	* \param *P Problem at hand, containing Lattice and Ions
	1921	* \param r parameter r
	1922	* \param index index of the basis vector
	1923	* \return \f$d(r)\f$
	1924	* \note Continuous Set of Damped Gauge Transformations according to Keith and Bader
	1925	*/
	1926	inline double ShiftGaugeOrigin(struct Problem *P, double r, const int index)
	1927	{
	1928	struct Ions *I = &P->Ion;
	1929	struct Lattice *Lat = &P->Lat;
	1930	double x, tmp;
	1931	int is,ia;
	1932
	1933	// loop over all ions to calculate the sum
	1934	x = r;
	1935	for (is=0; is < I->Max_Types; is++)
	1936	for (ia=0; ia < I->I[is].Max_IonsOfType; ia++) {
	1937	tmp = (r - I->I[is].R[NDIM*ia]);
	1938	x -= tmpexp(- I->I[is].alpha[ia] tpow(tmp,4));
	1939	}
	1940
	1941	return(sawtooth(Lat,x,index)); // still use sawtooth due to the numerical instability around the border region of the cell
	1942	}
	1943
	1944	/** Print sawtooth() for each node along one axis.
	1945	* \param *P Problem at hand, containing RunStruct, Lattice and LatticeLevel RunStruct#LevS
	1946	* \param index index of axis
	1947	*/
	1948	void TestSawtooth(struct Problem *P, const int index)
	1949	{
	1950	struct RunStruct *R = &P->R;
	1951	struct LatticeLevel *LevS = R->LevS;
	1952	struct Lattice *Lat =&P->Lat;
	1953	double x;
	1954	int n;
	1955	int N[NDIM];
	1956	N[0] = LevS->Plan0.plan->N[0];
	1957	N[1] = LevS->Plan0.plan->N[1];
	1958	N[2] = LevS->Plan0.plan->N[2];
	1959
	1960	for (n=0;n<N[index];n++) {
[f5586e]	1961	x = (double)n/(double)N[index] * sqrt(Lat->RealBasisSQ[index]);
	1962	//fprintf(stderr,"(%i) x %e\t Axis/2 %e\n",P->Par.me, x, sqrt(Lat->RealBasisSQ[index])/2. );
	1963	x = MinImageConv(Lat, x, sqrt(Lat->RealBasisSQ[index])/2., index);
[a0bcf1]	1964	fprintf(stderr,"%e\t%e\n", x, sawtooth(Lat,x,index));
	1965	}
	1966	}
	1967
	1968	/** Secures minimum image convention between two given points \a R[] and \a r[] within periodic boundary.
	1969	* Each distance component within a periodic boundary must always be between -L/2 ... L/2
	1970	* \param *Lat pointer to Lattice structure
	1971	* \param R[] first vector, NDIM, each must be between 0...L
	1972	* \param r[] second vector, NDIM, each must be between 0...L
	1973	* \param index of component
	1974	* \return component between -L/2 ... L/2
	1975	*/
	1976	inline double MinImageConv(struct Lattice *Lat, const double R, const double r, const int index)
	1977	{
[f5586e]	1978	double axis = sqrt(Lat->RealBasisSQ[index]);
[a0bcf1]	1979	double result = 0.;
	1980
	1981	if (fabs(result = R - r + axis) < axis/2.) { }
	1982	else if (fabs(result = R - r) <= axis/2.) { }
	1983	else if (fabs(result = R - r - axis) < axis/2.) { }
	1984	else Error(SomeError, "MinImageConv: None of the three cases applied!");
	1985	return (result);
	1986	}
	1987
	1988
	1989	/** Fouriertransforms given \a source.
	1990	* By the use of the symmetry parameter an additional imaginary unit and/or the momentum operator can
	1991	* be applied at the same time.
	1992	* \param *P Problem at hand
	1993	* \param *Psi source array of reciprocal coefficients
	1994	* \param *PsiR destination array, becoming filled with real coefficients
	1995	* \param index_g component of G vector (only needed for symmetry=4..7)
	1996	* \param symmetry 0 - do nothing, 1 - factor by "-1", 2 - factor by "i", 3 - factor by "1/i = -i", from 4 to 7 the same
	1997	* but additionally with momentum operator
	1998	*/
	1999	void fft_Psi(struct Problem P, const fftw_complex Psi, fftw_real *PsiR, const int index_g, const int symmetry)
	2000	{
	2001	struct Lattice *Lat = &P->Lat;
	2002	struct RunStruct *R = &P->R;
	2003	struct LatticeLevel *Lev0 = R->Lev0;
	2004	struct LatticeLevel *LevS = R->LevS;
	2005	struct Density *Dens0 = Lev0->Dens;
	2006	struct fft_plan_3d *plan = Lat->plan;
	2007	fftw_complex tempdestRC = (fftw_complex )Dens0->DensityArray[TempDensity];
	2008	fftw_complex *work = Dens0->DensityCArray[TempDensity];
	2009	fftw_complex posfac, destpos, destRCS, destRCD;
	2010	int i, Index, pos;
	2011
	2012	LockDensityArray(Dens0,TempDensity,imag); // tempdestRC
	2013	SetArrayToDouble0((double )tempdestRC, Dens0->TotalSize2);
	2014	SetArrayToDouble0((double )PsiR, Dens0->TotalSize2);
	2015	switch (symmetry) {
	2016	case 0:
	2017	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is positive
	2018	Index = LevS->GArray[i].Index;
	2019	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
	2020	destpos = &tempdestRC[LevS->MaxNUp*Index];
	2021	for (pos=0; pos < LevS->MaxNUp; pos++) {
	2022	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
	2023	destpos[pos].re = (Psi[i].re)posfac[pos].re-(Psi[i].im)posfac[pos].im;
	2024	destpos[pos].im = (Psi[i].re)posfac[pos].im+(Psi[i].im)posfac[pos].re;
	2025	}
	2026	}
	2027	break;
	2028	case 1:
	2029	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is - positive
	2030	Index = LevS->GArray[i].Index;
	2031	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
	2032	destpos = &tempdestRC[LevS->MaxNUp*Index];
	2033	for (pos=0; pos < LevS->MaxNUp; pos++) {
	2034	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
	2035	destpos[pos].re = -((Psi[i].re)posfac[pos].re-(Psi[i].im)posfac[pos].im);
	2036	destpos[pos].im = -((Psi[i].re)posfac[pos].im+(Psi[i].im)posfac[pos].re);
	2037	}
	2038	}
	2039	break;
	2040	case 2:
	2041	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is negative
	2042	Index = LevS->GArray[i].Index;
	2043	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
	2044	destpos = &tempdestRC[LevS->MaxNUp*Index];
	2045	for (pos=0; pos < LevS->MaxNUp; pos++) {
	2046	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
	2047	destpos[pos].re = (-Psi[i].im)posfac[pos].re-(Psi[i].re)posfac[pos].im;
	2048	destpos[pos].im = (-Psi[i].im)posfac[pos].im+(Psi[i].re)posfac[pos].re;
	2049	}
	2050	}
	2051	break;
	2052	case 3:
	2053	for (i=0;i<LevS->MaxG;i++) { // incoming is negative, outgoing is positive
	2054	Index = LevS->GArray[i].Index;
	2055	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
	2056	destpos = &tempdestRC[LevS->MaxNUp*Index];
	2057	for (pos=0; pos < LevS->MaxNUp; pos++) {
	2058	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
	2059	destpos[pos].re = (Psi[i].im)posfac[pos].re-(-Psi[i].re)posfac[pos].im;
	2060	destpos[pos].im = (Psi[i].im)posfac[pos].im+(-Psi[i].re)posfac[pos].re;
	2061	}
	2062	}
	2063	break;
	2064	case 4:
	2065	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is positive
	2066	Index = LevS->GArray[i].Index;
	2067	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
	2068	destpos = &tempdestRC[LevS->MaxNUp*Index];
	2069	for (pos=0; pos < LevS->MaxNUp; pos++) {
	2070	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
	2071	destpos[pos].re = LevS->GArray[i].G[index_g]((Psi[i].re)posfac[pos].re-(Psi[i].im)*posfac[pos].im);
	2072	destpos[pos].im = LevS->GArray[i].G[index_g]((Psi[i].re)posfac[pos].im+(Psi[i].im)*posfac[pos].re);
	2073	}
	2074	}
	2075	break;
	2076	case 5:
	2077	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is - positive
	2078	Index = LevS->GArray[i].Index;
	2079	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
	2080	destpos = &tempdestRC[LevS->MaxNUp*Index];
	2081	for (pos=0; pos < LevS->MaxNUp; pos++) {
	2082	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
	2083	destpos[pos].re = -LevS->GArray[i].G[index_g]((Psi[i].re)posfac[pos].re-(Psi[i].im)*posfac[pos].im);
	2084	destpos[pos].im = -LevS->GArray[i].G[index_g]((Psi[i].re)posfac[pos].im+(Psi[i].im)*posfac[pos].re);
	2085	}
	2086	}
	2087	break;
	2088	case 6:
	2089	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is negative
	2090	Index = LevS->GArray[i].Index;
	2091	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
	2092	destpos = &tempdestRC[LevS->MaxNUp*Index];
	2093	for (pos=0; pos < LevS->MaxNUp; pos++) {
	2094	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
	2095	destpos[pos].re = LevS->GArray[i].G[index_g]((-Psi[i].im)posfac[pos].re-(Psi[i].re)*posfac[pos].im);
	2096	destpos[pos].im = LevS->GArray[i].G[index_g]((-Psi[i].im)posfac[pos].im+(Psi[i].re)*posfac[pos].re);
	2097	}
	2098	}
	2099	break;
	2100	case 7:
	2101	for (i=0;i<LevS->MaxG;i++) { // incoming is negative, outgoing is positive
	2102	Index = LevS->GArray[i].Index;
	2103	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
	2104	destpos = &tempdestRC[LevS->MaxNUp*Index];
	2105	for (pos=0; pos < LevS->MaxNUp; pos++) {
	2106	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
	2107	destpos[pos].re = LevS->GArray[i].G[index_g]((Psi[i].im)posfac[pos].re-(-Psi[i].re)*posfac[pos].im);
	2108	destpos[pos].im = LevS->GArray[i].G[index_g]((Psi[i].im)posfac[pos].im+(-Psi[i].re)*posfac[pos].re);
	2109	}
	2110	}
	2111	break;
	2112	}
	2113	for (i=0; i<LevS->MaxDoubleG; i++) {
	2114	destRCS = &tempdestRC[LevS->DoubleG[2i]LevS->MaxNUp];
	2115	destRCD = &tempdestRC[LevS->DoubleG[2i+1]LevS->MaxNUp];
	2116	for (pos=0; pos < LevS->MaxNUp; pos++) {
	2117	//if (destRCD != &tempdestRC[LevS->DoubleG[2i+1]LevS->MaxNUp] \|\| LevS->DoubleG[2i+1]LevS->MaxNUp+pos<0 \|\| LevS->DoubleG[2i+1]LevS->MaxNUp+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destRCD corrupted");
	2118	destRCD[pos].re = destRCS[pos].re;
	2119	destRCD[pos].im = -destRCS[pos].im;
	2120	}
	2121	}
	2122	fft_3d_complex_to_real(plan, LevS->LevelNo, FFTNFUp, tempdestRC, work);
	2123	DensityRTransformPos(LevS,(fftw_real*)tempdestRC, PsiR);
	2124	UnLockDensityArray(Dens0,TempDensity,imag); // tempdestRC
	2125	}
	2126
	2127	/** Locks all NDIM_NDIM current density arrays
	2128	* \param Dens0 Density structure to be locked (in the current parts)
	2129	*/
	2130	void AllocCurrentDensity(struct Density *Dens0) {
	2131	// real
	2132	LockDensityArray(Dens0,CurrentDensity0,real); // CurrentDensity[B_index]
	2133	LockDensityArray(Dens0,CurrentDensity1,real); // CurrentDensity[B_index]
	2134	LockDensityArray(Dens0,CurrentDensity2,real); // CurrentDensity[B_index]
	2135	LockDensityArray(Dens0,CurrentDensity3,real); // CurrentDensity[B_index]
	2136	LockDensityArray(Dens0,CurrentDensity4,real); // CurrentDensity[B_index]
	2137	LockDensityArray(Dens0,CurrentDensity5,real); // CurrentDensity[B_index]
	2138	LockDensityArray(Dens0,CurrentDensity6,real); // CurrentDensity[B_index]
	2139	LockDensityArray(Dens0,CurrentDensity7,real); // CurrentDensity[B_index]
	2140	LockDensityArray(Dens0,CurrentDensity8,real); // CurrentDensity[B_index]
	2141	// imaginary
	2142	LockDensityArray(Dens0,CurrentDensity0,imag); // CurrentDensity[B_index]
	2143	LockDensityArray(Dens0,CurrentDensity1,imag); // CurrentDensity[B_index]
	2144	LockDensityArray(Dens0,CurrentDensity2,imag); // CurrentDensity[B_index]
	2145	LockDensityArray(Dens0,CurrentDensity3,imag); // CurrentDensity[B_index]
	2146	LockDensityArray(Dens0,CurrentDensity4,imag); // CurrentDensity[B_index]
	2147	LockDensityArray(Dens0,CurrentDensity5,imag); // CurrentDensity[B_index]
	2148	LockDensityArray(Dens0,CurrentDensity6,imag); // CurrentDensity[B_index]
	2149	LockDensityArray(Dens0,CurrentDensity7,imag); // CurrentDensity[B_index]
	2150	LockDensityArray(Dens0,CurrentDensity8,imag); // CurrentDensity[B_index]
	2151	}
	2152
	2153	/** Reset and unlocks all NDIM_NDIM current density arrays
	2154	* \param Dens0 Density structure to be unlocked/resetted (in the current parts)
	2155	*/
	2156	void DisAllocCurrentDensity(struct Density *Dens0) {
	2157	//int i;
	2158	// real
	2159	// for(i=0;i<NDIM*NDIM;i++)
	2160	// SetArrayToDouble0((double )Dens0->DensityArray[i], Dens0->TotalSize2);
	2161	UnLockDensityArray(Dens0,CurrentDensity0,real); // CurrentDensity[B_index]
	2162	UnLockDensityArray(Dens0,CurrentDensity1,real); // CurrentDensity[B_index]
	2163	UnLockDensityArray(Dens0,CurrentDensity2,real); // CurrentDensity[B_index]
	2164	UnLockDensityArray(Dens0,CurrentDensity3,real); // CurrentDensity[B_index]
	2165	UnLockDensityArray(Dens0,CurrentDensity4,real); // CurrentDensity[B_index]
	2166	UnLockDensityArray(Dens0,CurrentDensity5,real); // CurrentDensity[B_index]
	2167	UnLockDensityArray(Dens0,CurrentDensity6,real); // CurrentDensity[B_index]
	2168	UnLockDensityArray(Dens0,CurrentDensity7,real); // CurrentDensity[B_index]
	2169	UnLockDensityArray(Dens0,CurrentDensity8,real); // CurrentDensity[B_index]
	2170	// imaginary
	2171	// for(i=0;i<NDIM*NDIM;i++)
	2172	// SetArrayToDouble0((double )Dens0->DensityCArray[i], Dens0->TotalSize2);
	2173	UnLockDensityArray(Dens0,CurrentDensity0,imag); // CurrentDensity[B_index]
	2174	UnLockDensityArray(Dens0,CurrentDensity1,imag); // CurrentDensity[B_index]
	2175	UnLockDensityArray(Dens0,CurrentDensity2,imag); // CurrentDensity[B_index]
	2176	UnLockDensityArray(Dens0,CurrentDensity3,imag); // CurrentDensity[B_index]
	2177	UnLockDensityArray(Dens0,CurrentDensity4,imag); // CurrentDensity[B_index]
	2178	UnLockDensityArray(Dens0,CurrentDensity5,imag); // CurrentDensity[B_index]
	2179	UnLockDensityArray(Dens0,CurrentDensity6,imag); // CurrentDensity[B_index]
	2180	UnLockDensityArray(Dens0,CurrentDensity7,imag); // CurrentDensity[B_index]
	2181	UnLockDensityArray(Dens0,CurrentDensity8,imag); // CurrentDensity[B_index]
	2182	}
	2183
	2184	// these defines safe-guard same symmetry for same kind of wave function
	2185	#define Psi0symmetry 0 // //0 //0 //0 // regard psi0 as real
	2186	#define Psi1symmetry 0 // //3 //0 //0 // regard psi0 as real
	2187	#define Psip0symmetry 6 //6 //6 //6 //6 // momentum times "i" due to operation on left hand
	2188	#define Psip1symmetry 7 //7 //4 //6 //7 // momentum times "-i" as usual (right hand)
	2189
	2190	/** Evaluates the 3x3 current density arrays.
	2191	* The formula we want to evaluate is as follows
	2192	* \f[
	2193	* j_k(r) = \langle \psi_k^{(0)} \| \Bigl ( p\|r'\rangle\langle r' \| + \| r' \rangle \langle r' \| p \Bigr )
	2194	\Bigl [ \| \psi_k^{(r\times p )} \rangle - r' \times \| \psi_k^{(p)} \rangle \Bigr ] \cdot B.
	2195	* \f]
	2196	* Most of the DensityTypes-arrays are locked for temporary use. Pointers are set to their
	2197	* start address and afterwards the current density arrays locked and reset'ed. Then for every
	2198	* unperturbed wave function we do:
	2199	* -# FFT unperturbed p-perturbed and rxp-perturbed wave function
	2200	* -# FFT wave function with applied momentum operator for all three indices
	2201	* -# For each index of the momentum operator:
	2202	* -# FFT p-perturbed wave function
	2203	* -# For every index of the external field:
	2204	* -# FFT rxp-perturbed wave function
	2205	* -# Evaluate current density for these momentum index and external field indices
	2206	*
	2207	* Afterwards the temporary densities are unlocked and the density ones gathered from all Psi-
	2208	* sharing processes.
	2209	*
	2210	* \param *P Problem at hand, containing Lattice and RunStruct
	2211	*/
	2212	void FillCurrentDensity(struct Problem *P)
	2213	{
	2214	struct Lattice *Lat = &P->Lat;
	2215	struct RunStruct *R = &P->R;
	2216	struct Psis *Psi = &Lat->Psi;
	2217	struct LatticeLevel *LevS = R->LevS;
	2218	struct LatticeLevel *Lev0 = R->Lev0;
	2219	struct Density *Dens0 = Lev0->Dens;
	2220	fftw_complex *Psi0;
	2221	fftw_real Psi0R, Psip0R;
	2222	fftw_real CurrentDensity[NDIMNDIM];
	2223	fftw_real *Psi1R;
	2224	fftw_real *Psip1R;
	2225	fftw_real *tempArray; // intendedly the same
	2226	double r_bar[NDIM], x[NDIM], fac[NDIM];
	2227	double Current;//, current;
	2228	const double UnitsFactor = 1.; ///LevS->MaxN; // 1/N (from ff-backtransform)
	2229	int i, index, B_index;
	2230	int k, j, i0;
	2231	int n[NDIM], n0;
	2232	int N[NDIM];
	2233	N[0] = Lev0->Plan0.plan->N[0];
	2234	N[1] = Lev0->Plan0.plan->N[1];
	2235	N[2] = Lev0->Plan0.plan->N[2];
	2236	const int N0 = Lev0->Plan0.plan->local_nx;
	2237	//int ActNum;
	2238	const int myPE = P->Par.me_comm_ST_Psi;
	2239	const int type = R->CurrentMin;
	2240	MPI_Status status;
	2241	int cross_lookup_1[4], cross_lookup_3[4], l_1 = 0, l_3 = 0;
	2242
	2243	//fprintf(stderr,"(%i) FactoR %e\n", P->Par.me, R->FactorDensityR);
	2244
	2245	// Init values and pointers
	2246	if (P->Call.out[PsiOut]) {
	2247	fprintf(stderr,"(%i) LockArray: ", P->Par.me);
	2248	for(i=0;i<MaxDensityTypes;i++)
	2249	fprintf(stderr,"(%i,%i) ",Dens0->LockArray[i],Dens0->LockCArray[i]);
	2250	fprintf(stderr,"\n");
	2251	}
	2252	LockDensityArray(Dens0,Temp2Density,real); // Psi1R
	2253	LockDensityArray(Dens0,Temp2Density,imag); // Psip1R and tempArray
	2254	LockDensityArray(Dens0,GapDensity,real); // Psi0R
	2255	LockDensityArray(Dens0,GapLocalDensity,real); // Psip0R
	2256
	2257	Psi0R = (fftw_real *)Dens0->DensityArray[GapDensity];
	2258	Psip0R = (fftw_real *)Dens0->DensityArray[GapLocalDensity];
	2259	Psi1R = (fftw_real *)Dens0->DensityArray[Temp2Density];
	2260	tempArray = Psip1R = (fftw_real *)Dens0->DensityCArray[Temp2Density];
	2261	SetArrayToDouble0((double )Psi0R,Dens0->TotalSize2);
	2262	SetArrayToDouble0((double )Psip0R,Dens0->TotalSize2);
	2263	SetArrayToDouble0((double )Psi1R,Dens0->TotalSize2);
	2264	SetArrayToDouble0((double )Psip1R,Dens0->TotalSize2);
	2265
	2266	if (P->Call.out[PsiOut]) {
	2267	fprintf(stderr,"(%i) LockArray: ", P->Par.me);
	2268	for(i=0;i<MaxDensityTypes;i++)
	2269	fprintf(stderr,"(%i,%i) ",Dens0->LockArray[i],Dens0->LockCArray[i]);
	2270	fprintf(stderr,"\n");
	2271	}
	2272
	2273	// don't put the following stuff into a for loop, they might not be continuous! (preprocessor values: CurrentDensity...)
	2274	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
	2275	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
	2276	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
	2277	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
	2278	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
	2279	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
	2280	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
	2281	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
	2282	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
	2283
	2284	// initialize the array if it is the first of all six perturbation run
	2285	if ((R->DoFullCurrent == 0) && (R->CurrentMin == Perturbed_P0)) { // reset if FillDelta...() hasn't done it before
	2286	debug(P,"resetting CurrentDensity...");
	2287	for (B_index=0; B_index<NDIM*NDIM; B_index++) // initialize current density array
	2288	SetArrayToDouble0((double )CurrentDensity[B_index],Dens0->TotalSize2); // DensityArray is fftw_real, no 2*LocalSizeR here!
	2289	}
	2290
	2291	switch(type) { // set j (which is linked to the index from derivation wrt to B^{ext})
	2292	case Perturbed_P0:
	2293	case Perturbed_P1:
	2294	case Perturbed_P2:
	2295	j = type - Perturbed_P0;
	2296	l_1 = crossed(j,1);
	2297	l_3 = crossed(j,3);
	2298	for(k=0;k<4;k++) {
	2299	cross_lookup_1[k] = cross(l_1,k);
	2300	cross_lookup_3[k] = cross(l_3,k);
	2301	}
	2302	break;
	2303	case Perturbed_RxP0:
	2304	case Perturbed_RxP1:
	2305	case Perturbed_RxP2:
	2306	j = type - Perturbed_RxP0;
	2307	break;
	2308	default:
	2309	j = 0;
	2310	Error(SomeError,"FillCurrentDensity() called while not in perturbed minimisation!");
	2311	break;
	2312	}
	2313
	2314	int wished = -1;
	2315	FILE *file = fopen(P->Call.MainParameterFile,"r");
[961b75]	2316	if (!ParseForParameter(1,file,"Orbital",0,1,1,int_type,&wished, 1, optional)) {
[a0bcf1]	2317	fprintf(stderr,"Desired Orbital missing!\n");
	2318	wished = -1;
	2319	} else if (wished != -1) {
	2320	fprintf(stderr,"Desired Orbital is: %i.\n", wished);
	2321	} else {
	2322	fprintf(stderr,"Desired Orbital is: All.\n");
	2323	}
	2324	fclose(file);
	2325
	2326	// Commence grid filling
	2327	for (k=Psi->TypeStartIndex[Occupied];k<Psi->TypeStartIndex[Occupied+1];k++) // every local wave functions adds up its part of the current
	2328	if ((k + P->Par.me_comm_ST_PsiT*(Psi->TypeStartIndex[UnOccupied]-Psi->TypeStartIndex[Occupied]) == wished) \|\| (wished == -1)) { // compare with global number
	2329	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i)Calculating Current Density Summand of type %s for Psi (%i/%i) ... \n", P->Par.me, R->MinimisationName[type], Psi->LocalPsiStatus[k].MyGlobalNo, k);
	2330	//ActNum = k - Psi->TypeStartIndex[Occupied] + Psi->TypeStartIndex[1] * Psi->LocalPsiStatus[k].my_color_comm_ST_Psi; // global number of unperturbed Psi
	2331	Psi0 = LevS->LPsi->LocalPsi[k]; // Local unperturbed psi
	2332
	2333	// now some preemptive ffts for the whole grid
	2334	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Bringing \|Psi0> one level up and fftransforming\n", P->Par.me);
	2335	fft_Psi(P, Psi0, Psi0R, 0, Psi0symmetry); //0 // 0 //0
	2336
	2337	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Bringing \|Psi1> one level up and fftransforming\n", P->Par.me);
	2338	fft_Psi(P, LevS->LPsi->LocalPsi[Psi->TypeStartIndex[type]+k], Psi1R, 0, Psi1symmetry); //3 //0 //0
	2339
	2340	for (index=0;index<NDIM;index++) { // for all NDIM components of momentum operator
	2341
	2342	if ((P->Call.out[StepLeaderOut]) && (!index)) fprintf(stderr,"(%i) Bringing p\|Psi0> one level up and fftransforming\n", P->Par.me);
	2343	fft_Psi(P, Psi0, Psip0R, index, Psip0symmetry); //6 //6 //6
	2344
	2345	if ((P->Call.out[StepLeaderOut]) && (!index)) fprintf(stderr,"(%i) Bringing p\|Psi1> one level up and fftransforming\n", P->Par.me);
	2346	fft_Psi(P, LevS->LPsi->LocalPsi[Psi->TypeStartIndex[type]+k], Psip1R, index, Psip1symmetry); //4 //6 //7
	2347
	2348	// then for every point on the grid in real space ...
	2349
	2350	//if (Psi1R != (fftw_real *)Dens0->DensityArray[Temp2Density] \|\| i0<0 \|\| i0>=Dens0->LocalSizeR) Error(SomeError,"fft_Psi: Psi1R corrupted");
	2351	//Psi1R[i0] = (Psi1_rxp_R[j])[i0] - (r_bar[cross(j,0)] * (Psi1_p_R[cross(j,1)])[i0] - r_bar[cross(j,2)] * (Psi1_p_R[cross(j,3)])[i0]); //
	2352	//if (Psip1R != (fftw_real *)Dens0->DensityCArray[Temp2Density] \|\| i0<0 \|\| i0>=Dens0->LocalSizeR) Error(SomeError,"fft_Psi: Psip1R corrupted");
	2353	//Psip1R[i0] = Psi1_rxp_pR[i0] - (r_bar[cross(j,0)] * (Psi1_p_pR[cross(j,1)])[i0] - r_bar[cross(j,2)] * (Psi1_p_pR[cross(j,3)])[i0]); //
	2354
	2355	switch(type) {
	2356	case Perturbed_P0:
	2357	case Perturbed_P1:
	2358	case Perturbed_P2:
	2359	for (n0=0;n0<N0;n0++) // only local points on x axis
	2360	for (n[1]=0;n[1]<N[1];n[1]++)
	2361	for (n[2]=0;n[2]<N[2];n[2]++) {
	2362	i0 = n[2]+N[2](n[1]+N[1]n0);
	2363	n[0]=n0 + N0*myPE; // global relative coordinate: due to partitoning of x-axis in PEPGamma>1 case
	2364	fac[0] = (double)n[0]/(double)N[0];
	2365	fac[1] = (double)n[1]/(double)N[1];
	2366	fac[2] = (double)n[2]/(double)N[2];
	2367	RMat33Vec3(x, Lat->RealBasis, fac); // relative coordinate times basis matrix gives absolute ones
	2368	for (i=0;i<NDIM;i++) // build gauge-translated r_bar evaluation point
	2369	r_bar[i] =
	2370	sawtooth(Lat,MinImageConv(Lat, x[i], Psi->AddData[k].WannierCentre[i], i),i);
	2371	// ShiftGaugeOrigin(P,truedist(Lat, x[i], Psi->AddData[k].WannierCentre[i], i),i);
	2372	//truedist(Lat, x[i], Psi->AddData[k].WannierCentre[i], i);
	2373
	2374	Current = Psip0R[i0] * (r_bar[cross_lookup_1[0]] * Psi1R[i0]);
	2375	Current += (Psi0R[i0] * r_bar[cross_lookup_1[0]] * Psip1R[i0]);
	2376	Current = .5 UnitsFactor * Psi->LocalPsiStatus[k].PsiFactor * R->FactorDensityR; // factor confirmed, see CalculateOneDensityR() and InitDensityCalculation()
	2377	////if (CurrentDensity[index+jNDIM] != (fftw_real ) Dens0->DensityArray[CurrentDensity0 + index+jNDIM] \|\| i0<0 \|\| i0>=Dens0->LocalSizeR \|\| (index+jNDIM)<0 \|\| (index+jNDIM)>=NDIMNDIM) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
	2378	CurrentDensity[index+l_1*NDIM][i0] -= Current; // note: sign of cross product resides in Current itself (here: plus)
	2379
	2380	Current = - Psip0R[i0] * (r_bar[cross_lookup_3[2]] * Psi1R[i0]);
	2381	Current += - (Psi0R[i0] * r_bar[cross_lookup_3[2]] * Psip1R[i0]);
	2382	Current = .5 UnitsFactor * Psi->LocalPsiStatus[k].PsiFactor * R->FactorDensityR; // factor confirmed, see CalculateOneDensityR() and InitDensityCalculation()
	2383	////if (CurrentDensity[index+jNDIM] != (fftw_real ) Dens0->DensityArray[CurrentDensity0 + index+jNDIM] \|\| i0<0 \|\| i0>=Dens0->LocalSizeR \|\| (index+jNDIM)<0 \|\| (index+jNDIM)>=NDIMNDIM) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
	2384	CurrentDensity[index+l_3*NDIM][i0] -= Current; // note: sign of cross product resides in Current itself (here: minus)
	2385	}
	2386	break;
	2387	case Perturbed_RxP0:
	2388	case Perturbed_RxP1:
	2389	case Perturbed_RxP2:
	2390	for (n0=0;n0<N0;n0++) // only local points on x axis
	2391	for (n[1]=0;n[1]<N[1];n[1]++)
	2392	for (n[2]=0;n[2]<N[2];n[2]++) {
	2393	i0 = n[2]+N[2](n[1]+N[1]n0);
	2394	Current = (Psip0R[i0] * Psi1R[i0] + Psi0R[i0] * Psip1R[i0]);
	2395	Current = .5 UnitsFactor * Psi->LocalPsiStatus[k].PsiFactor * R->FactorDensityR; // factor confirmed, see CalculateOneDensityR() and InitDensityCalculation()
	2396	////if (CurrentDensity[index+jNDIM] != (fftw_real ) Dens0->DensityArray[CurrentDensity0 + index+jNDIM] \|\| i0<0 \|\| i0>=Dens0->LocalSizeR \|\| (index+jNDIM)<0 \|\| (index+jNDIM)>=NDIMNDIM) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
	2397	CurrentDensity[index+j*NDIM][i0] += Current;
	2398	}
	2399	break;
	2400	default:
	2401	break;
	2402	}
	2403	}
	2404	//OutputCurrentDensity(P);
	2405	}
	2406
	2407	//debug(P,"Unlocking arrays");
	2408	//debug(P,"GapDensity");
	2409	UnLockDensityArray(Dens0,GapDensity,real); // Psi0R
	2410	//debug(P,"GapLocalDensity");
	2411	UnLockDensityArray(Dens0,GapLocalDensity,real); // Psip0R
	2412	//debug(P,"Temp2Density");
	2413	UnLockDensityArray(Dens0,Temp2Density,real); // Psi1R
	2414
	2415	// if (P->Call.out[StepLeaderOut])
	2416	// fprintf(stderr,"\n\n");
	2417
	2418	//debug(P,"MPI operation");
	2419	// and in the end gather partial densities from other processes
	2420	if (type == Perturbed_RxP2) // exchange all (due to shared wave functions) only after last pertubation run
	2421	for (index=0;index<NDIM*NDIM;index++) {
	2422	//if (tempArray != (fftw_real *)Dens0->DensityCArray[Temp2Density]) Error(SomeError,"FillCurrentDensity: tempArray corrupted");
	2423	//debug(P,"tempArray to zero");
	2424	SetArrayToDouble0((double )tempArray, Dens0->TotalSize2);
	2425	////if (CurrentDensity[index] != (fftw_real *) Dens0->DensityArray[CurrentDensity0 + index]) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
	2426	//debug(P,"CurrentDensity exchange");
	2427	MPI_Allreduce( CurrentDensity[index], tempArray, Dens0->LocalSizeR, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_PsiT); // gather results from all wave functions ...
	2428	switch(Psi->PsiST) { // ... and also from SpinUp/Downs
	2429	default:
	2430	//debug(P,"CurrentDensity = tempArray");
	2431	for (i=0;i<Dens0->LocalSizeR;i++) {
	2432	////if (CurrentDensity[index] != (fftw_real *) Dens0->DensityArray[CurrentDensity0 + index] \|\| i<0 \|\| i>=Dens0->LocalSizeR) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
	2433	CurrentDensity[index][i] = tempArray[i];
	2434	}
	2435	break;
	2436	case SpinUp:
	2437	//debug(P,"CurrentDensity exchange spinup");
	2438	MPI_Sendrecv(tempArray, Dens0->LocalSizeR, MPI_DOUBLE, P->Par.me_comm_ST, CurrentTag1,
	2439	CurrentDensity[index], Dens0->LocalSizeR, MPI_DOUBLE, P->Par.me_comm_ST, CurrentTag2, P->Par.comm_STInter, &status );
	2440	//debug(P,"CurrentDensity += tempArray");
	2441	for (i=0;i<Dens0->LocalSizeR;i++) {
	2442	////if (CurrentDensity[index] != (fftw_real *) Dens0->DensityArray[CurrentDensity0 + index] \|\| i<0 \|\| i>=Dens0->LocalSizeR) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
	2443	CurrentDensity[index][i] += tempArray[i];
	2444	}
	2445	break;
	2446	case SpinDown:
	2447	//debug(P,"CurrentDensity exchange spindown");
	2448	MPI_Sendrecv(tempArray, Dens0->LocalSizeR, MPI_DOUBLE, P->Par.me_comm_ST, CurrentTag2,
	2449	CurrentDensity[index], Dens0->LocalSizeR, MPI_DOUBLE, P->Par.me_comm_ST, CurrentTag1, P->Par.comm_STInter, &status );
	2450	//debug(P,"CurrentDensity += tempArray");
	2451	for (i=0;i<Dens0->LocalSizeR;i++) {
	2452	////if (CurrentDensity[index] != (fftw_real *) Dens0->DensityArray[CurrentDensity0 + index] \|\| i<0 \|\| i>=Dens0->LocalSizeR) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
	2453	CurrentDensity[index][i] += tempArray[i];
	2454	}
	2455	break;
	2456	}
	2457	}
	2458	//debug(P,"Temp2Density");
	2459	UnLockDensityArray(Dens0,Temp2Density,imag); // Psip1R and tempArray
	2460	//debug(P,"CurrentDensity end");
	2461	}
	2462
	2463	/** Structure holding Problem at hand and two indices, defining the greens function to be inverted.
	2464	*/
	2465	struct params
	2466	{
	2467	struct Problem *P;
	2468	int *k;
	2469	int *l;
	2470	int *iter;
	2471	fftw_complex *x_l;
	2472	};
	2473
	2474	/** Wrapper function to solve G_kl x = b for x.
	2475	* \param *x above x
	2476	* \param *param additional parameters, here Problem at hand
	2477	* \return evaluated to be minimized functional \f$\frac{1}{2}x \cdot Ax - xb\f$ at \a x on return
	2478	*/
	2479	static double DeltaCurrent_f(const gsl_vector * x, void * param)
	2480	{
	2481	struct Problem P = ((struct params )param)->P;
	2482	struct RunStruct *R = &P->R;
	2483	struct LatticeLevel *LevS = R->LevS;
	2484	struct Psis *Psi = &P->Lat.Psi;
	2485	struct PseudoPot *PP = &P->PP;
	2486	const double PsiFactor = Psi->AllPsiStatus[((struct params )param)->k].PsiFactor;
	2487	double result = 0.;
	2488	fftw_complex *TempPsi = LevS->LPsi->TempPsi;
	2489	fftw_complex *TempPsi2 = LevS->LPsi->TempPsi2;
	2490	int u;
	2491
	2492	//fprintf(stderr,"Evaluating f(%i,%i) for %i-th time\n", ((struct params )param)->k, ((struct params )param)->l, ((struct params )param)->iter);
	2493
	2494	// extract gsl_vector
	2495	for (u=0;u<LevS->MaxG;u++) {
	2496	TempPsi[u].re = gsl_vector_get(x, 2*u);
	2497	TempPsi[u].im = gsl_vector_get(x, 2*u+1);
	2498	}
	2499	// generate fnl
	2500	CalculateCDfnl(P, TempPsi, PP->CDfnl); // calculate needed non-local form factors
	2501	// Apply Hamiltonian to x
	2502	ApplyTotalHamiltonian(P,TempPsi,TempPsi2, PP->CDfnl,PsiFactor,0);
	2503	// take scalar product to get eigen value
	2504	result = .5 * PsiFactor * (((((struct params )param)->k == ((struct params )param)->l ? GradSP(P,LevS,TempPsi,TempPsi2) : 0.) - Psi->lambda[((struct params )param)->k][((struct params )param)->l])) - GradSP(P,LevS,TempPsi,LevS->LPsi->LocalPsi[((struct params )param)->l]);
	2505	return result;
	2506	}
	2507
	2508	/** Wrapper function to solve G_kl x = b for x.
	2509	* \param *x above x
	2510	* \param *param additional parameters, here Problem at hand
	2511	* \param *g gradient vector on return
	2512	* \return error code
	2513	*/
	2514	static void DeltaCurrent_df(const gsl_vector * x, void * param, gsl_vector * g)
	2515	{
	2516	struct Problem P = ((struct params )param)->P;
	2517	struct RunStruct *R = &P->R;
	2518	struct LatticeLevel *LevS = R->LevS;
	2519	struct Psis *Psi = &P->Lat.Psi;
	2520	struct PseudoPot *PP = &P->PP;
	2521	const double PsiFactor = Psi->AllPsiStatus[((struct params )param)->k].PsiFactor;
	2522	fftw_complex *TempPsi = LevS->LPsi->TempPsi;
	2523	fftw_complex *TempPsi2 = LevS->LPsi->TempPsi2;
	2524	fftw_complex x_l = ((struct params )param)->x_l;
	2525	int u;
	2526
	2527	//fprintf(stderr,"Evaluating df(%i,%i) for %i-th time\n", ((struct params )param)->k, ((struct params )param)->l, ((struct params )param)->iter);
	2528
	2529	// extract gsl_vector
	2530	for (u=0;u<LevS->MaxG;u++) {
	2531	TempPsi[u].re = gsl_vector_get(x, 2*u);
	2532	TempPsi[u].im = gsl_vector_get(x, 2*u+1);
	2533	}
	2534	// generate fnl
	2535	CalculateCDfnl(P, TempPsi, PP->CDfnl); // calculate needed non-local form factors
	2536	// Apply Hamiltonian to x
	2537	ApplyTotalHamiltonian(P,TempPsi,TempPsi2, PP->CDfnl,PsiFactor,0);
	2538	// put into returning vector
	2539	for (u=0;u<LevS->MaxG;u++) {
	2540	gsl_vector_set(g, 2*u, TempPsi2[u].re - x_l[u].re);
	2541	gsl_vector_set(g, 2*u+1, TempPsi2[u].im - x_l[u].im);
	2542	}
	2543	}
	2544
	2545	/** Wrapper function to solve G_kl x = b for x.
	2546	* \param *x above x
	2547	* \param *param additional parameters, here Problem at hand
	2548	* \param *f evaluated to be minimized functional \f$\frac{1}{2}x \cdot Ax - xb\f$ at \a x on return
	2549	* \param *g gradient vector on return
	2550	* \return error code
	2551	*/
	2552	static void DeltaCurrent_fdf(const gsl_vector * x, void * param, double * f, gsl_vector * g)
	2553	{
	2554	struct Problem P = ((struct params )param)->P;
	2555	struct RunStruct *R = &P->R;
	2556	struct LatticeLevel *LevS = R->LevS;
	2557	struct Psis *Psi = &P->Lat.Psi;
	2558	struct PseudoPot *PP = &P->PP;
	2559	const double PsiFactor = Psi->AllPsiStatus[((struct params )param)->k].PsiFactor;
	2560	fftw_complex *TempPsi = LevS->LPsi->TempPsi;
	2561	fftw_complex *TempPsi2 = LevS->LPsi->TempPsi2;
	2562	fftw_complex x_l = ((struct params )param)->x_l;
	2563	int u;
	2564
	2565	//fprintf(stderr,"Evaluating fdf(%i,%i) for %i-th time\n", ((struct params )param)->k, ((struct params )param)->l, ((struct params )param)->iter);
	2566
	2567	// extract gsl_vector
	2568	for (u=0;u<LevS->MaxG;u++) {
	2569	TempPsi[u].re = gsl_vector_get(x, 2*u);
	2570	TempPsi[u].im = gsl_vector_get(x, 2*u+1);
	2571	}
	2572	// generate fnl
	2573	CalculateCDfnl(P, TempPsi, PP->CDfnl); // calculate needed non-local form factors
	2574	// Apply Hamiltonian to x
	2575	ApplyTotalHamiltonian(P,TempPsi,TempPsi2, PP->CDfnl,PsiFactor,0);
	2576	// put into returning vector
	2577	for (u=0;u<LevS->MaxG;u++) {
	2578	gsl_vector_set(g, 2*u, TempPsi[u].re - x_l[u].re);
	2579	gsl_vector_set(g, 2*u+1, TempPsi[u].im - x_l[u].im);
	2580	}
	2581
	2582	f = .5 PsiFactor * (((((struct params )param)->k == ((struct params )param)->l ? GradSP(P,LevS,TempPsi,TempPsi2) : 0.) - Psi->lambda[((struct params )param)->k][((struct params )param)->l])) - GradSP(P,LevS,TempPsi,LevS->LPsi->LocalPsi[((struct params )param)->l]);
	2583	}
	2584
	2585	/** Evaluates the \f$\Delta j_k(r')\f$ component of the current density.
	2586	* \f[
	2587	* \Delta j_k(r') = \frac{e}{m} \sum_l \langle \varphi^{(0)}_k \| \left ( p \|r'\rangle \langle r'\| + \| r'\rangle\langle r'\|p \right ) {\cal G}_{kl} (d_k - d_l) \times p \| \varphi^{(1)}_l \rangle \cdot B
	2588	* \f]
	2589	* \param *P Problem at hand
	2590	* \note result has not yet been MPI_Allreduced for ParallelSimulationData#comm_ST_inter or ParallelSimulationData#comm_ST_PsiT groups!
	2591	* \warning the routine is checked but does not yet produce sensible results.
	2592	*/
	2593	void FillDeltaCurrentDensity(struct Problem *P)
	2594	{
	2595	struct Lattice *Lat = &P->Lat;
	2596	struct RunStruct *R = &P->R;
	2597	struct Psis *Psi = &Lat->Psi;
	2598	struct LatticeLevel *Lev0 = R->Lev0;
	2599	struct LatticeLevel *LevS = R->LevS;
	2600	struct Density *Dens0 = Lev0->Dens;
	2601	int i,j,s;
	2602	int k,l,u, in, dex, index,i0;
	2603	//const int Num = Psi->NoOfPsis;
	2604	int RecvSource;
	2605	MPI_Status status;
	2606	struct OnePsiElement OnePsiB, LOnePsiB, OnePsiA, LOnePsiA;
	2607	const int ElementSize = (sizeof(fftw_complex) / sizeof(double));
	2608	int n[NDIM], n0;
	2609	int N[NDIM];
	2610	N[0] = Lev0->Plan0.plan->N[0];
	2611	N[1] = Lev0->Plan0.plan->N[1];
	2612	N[2] = Lev0->Plan0.plan->N[2];
	2613	const int N0 = Lev0->Plan0.plan->local_nx;
	2614	fftw_complex *LPsiDatB;
	2615	fftw_complex Psi0, Psi1;
	2616	fftw_real Psi0R, Psip0R;
	2617	fftw_real Psi1R, Psip1R;
	2618	fftw_complex x_l = LevS->LPsi->TempPsi;//, *x_l_bak;
	2619	fftw_real CurrentDensity[NDIMNDIM];
	2620	int mem_avail, MEM_avail;
	2621	double Current;
	2622	const double UnitsFactor = 1.;
	2623	int cross_lookup[4];
	2624	struct params param;
	2625	double factor; // temporary factor in Psi1 pre-evaluation
	2626
	2627	LockDensityArray(Dens0,GapDensity,real); // Psi0R
	2628	LockDensityArray(Dens0,GapLocalDensity,real); // Psip0R
	2629	LockDensityArray(Dens0,Temp2Density,imag); // Psi1
	2630	LockDensityArray(Dens0,GapUpDensity,real); // Psi1R
	2631	LockDensityArray(Dens0,GapDownDensity,real); // Psip1R
	2632
	2633	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
	2634	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
	2635	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
	2636	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
	2637	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
	2638	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
	2639	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
	2640	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
	2641	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
	2642
	2643	Psi0R = (fftw_real *)Dens0->DensityArray[GapDensity];
	2644	Psip0R = (fftw_real *)Dens0->DensityArray[GapLocalDensity];
	2645	Psi1 = (fftw_complex *) Dens0->DensityCArray[Temp2Density];
	2646	Psi1R = (fftw_real *)Dens0->DensityArray[GapUpDensity];
	2647	Psip1R = (fftw_real *)Dens0->DensityArray[GapDownDensity];
	2648
	2649	// if (R->CurrentMin == Perturbed_P0)
	2650	// for (B_index=0; B_index<NDIM*NDIM; B_index++) { // initialize current density array
	2651	// debug(P,"resetting CurrentDensity...");
	2652	// SetArrayToDouble0((double )CurrentDensity[B_index],Dens0->TotalSize2); // DensityArray is fftw_real, no 2*LocalSizeR here!
	2653	// }
	2654	//if (Psi1 != (fftw_complex *) Dens0->DensityCArray[Temp2Density]) Error(SomeError,"FillDeltaCurrentDensity: Psi1 corrupted");
	2655	SetArrayToDouble0((double )Psi1,2Dens0->TotalSize);
	2656
	2657	// gsl_vector *x = gsl_vector_alloc(Num);
	2658	// gsl_matrix *G = gsl_matrix_alloc(Num,Num);
	2659	// gsl_permutation *p = gsl_permutation_alloc(Num);
	2660	//int signum;
	2661	// begin of GSL linearer CG solver stuff
	2662	int iter, Status;
	2663
	2664	const gsl_multimin_fdfminimizer_type *T;
	2665	gsl_multimin_fdfminimizer *minset;
	2666
	2667	/* Position of the minimum (1,2). */
	2668	//double par[2] = { 1.0, 2.0 };
	2669
	2670	gsl_vector *x;
	2671	gsl_multimin_function_fdf my_func;
	2672
	2673	param.P = P;
	2674	param.k = &k;
	2675	param.l = &l;
	2676	param.iter = &iter;
	2677	param.x_l = x_l;
	2678
	2679	my_func.f = &DeltaCurrent_f;
	2680	my_func.df = &DeltaCurrent_df;
	2681	my_func.fdf = &DeltaCurrent_fdf;
	2682	my_func.n = 2*LevS->MaxG;
	2683	my_func.params = (void *)&param;
	2684
	2685	T = gsl_multimin_fdfminimizer_conjugate_pr;
	2686	minset = gsl_multimin_fdfminimizer_alloc (T, 2*LevS->MaxG);
	2687	x = gsl_vector_alloc (2*LevS->MaxG);
	2688	// end of GSL CG stuff
	2689
	2690
	2691	// // construct G_kl = - (H^{(0)} \delta_{kl} -\langle \varphi^{(0)}_k \|H^{(0)}\| \varphi^{(0)}_l\|rangle)^{-1} = A^{-1}
	2692	// for (k=0;k<Num;k++)
	2693	// for (l=0;l<Num;l++)
	2694	// gsl_matrix_set(G, k, l, k == l ? 0. : Psi->lambda[k][l]);
	2695	// // and decompose G_kl = L U
	2696
	2697	mem_avail = MEM_avail = 0;
	2698	// x_l_bak = x_l = (fftw_complex *) Malloc(sizeof(fftw_complex )Num,"FillDeltaCurrentDensity: x_l");
	2699	// for (i=0;i<Num;i++) {
	2700	// x_l[i] = NULL;
	2701	// x_l[i] = (fftw_complex ) malloc(sizeof(fftw_complex)LevS->MaxG);
	2702	// if (x_l[i] == NULL) {
	2703	// mem_avail = 1; // there was not enough memory for this node
	2704	// fprintf(stderr,"(%i) FillDeltaCurrentDensity: x_l[%i] ... insufficient memory.\n",P->Par.me,i);
	2705	// }
	2706	// }
	2707	// MPI_Allreduce(&mem_avail,&MEM_avail,1,MPI_INT,MPI_SUM,P->Par.comm_ST); // sum results from all processes
	2708
	2709	if (MEM_avail != 0) { // means at least node couldn't allocate sufficient memory, skipping...
	2710	fprintf(stderr,"(%i) FillDeltaCurrentDensity: x_l[], not enough memory: %i! Skipping FillDeltaCurrentDensity evaluation.", P->Par.me, MEM_avail);
	2711	} else {
	2712	// sum over k and calculate \Delta j_k(r')
	2713	k=-1;
	2714	for (i=0; i < Psi->MaxPsiOfType+P->Par.Max_me_comm_ST_PsiT; i++) { // go through all wave functions
	2715	//fprintf(stderr,"(%i) GlobalNo: %d\tLocalNo: %d\n", P->Par.me,Psi->AllPsiStatus[i].MyGlobalNo,Psi->AllPsiStatus[i].MyLocalNo);
	2716	OnePsiA = &Psi->AllPsiStatus[i]; // grab OnePsiA
	2717	if (OnePsiA->PsiType == Occupied) { // drop the extra and perturbed ones
	2718	k++;
	2719	if (OnePsiA->my_color_comm_ST_Psi == P->Par.my_color_comm_ST_Psi) // local?
	2720	LOnePsiA = &Psi->LocalPsiStatus[OnePsiA->MyLocalNo];
	2721	else
	2722	LOnePsiA = NULL;
	2723	if (LOnePsiA != NULL) {
	2724	Psi0=LevS->LPsi->LocalPsi[OnePsiA->MyLocalNo];
	2725
	2726	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Bringing \|Psi0> one level up and fftransforming\n", P->Par.me);
	2727	//if (Psi0R != (fftw_real *)Dens0->DensityArray[GapDensity]) Error(SomeError,"FillDeltaCurrentDensity: Psi0R corrupted");
	2728	fft_Psi(P,Psi0,Psi0R, 0, Psi0symmetry); //0 // 0 //0
	2729
	2730	for (in=0;in<NDIM;in++) { // in is the index from derivation wrt to B^{ext}
	2731	l = -1;
	2732	for (j=0; j < Psi->MaxPsiOfType+P->Par.Max_me_comm_ST_PsiT; j++) { // go through all wave functions
	2733	OnePsiB = &Psi->AllPsiStatus[j]; // grab OnePsiA
	2734	if (OnePsiB->PsiType == Occupied)
	2735	l++;
	2736	if ((OnePsiB != OnePsiA) && (OnePsiB->PsiType == Occupied)) { // drop the same and the extra ones
	2737	if (OnePsiB->my_color_comm_ST_Psi == P->Par.my_color_comm_ST_Psi) // local?
	2738	LOnePsiB = &Psi->LocalPsiStatus[OnePsiB->MyLocalNo];
	2739	else
	2740	LOnePsiB = NULL;
	2741	if (LOnePsiB == NULL) { // if it's not local ... receive x from respective process
	2742	RecvSource = OnePsiB->my_color_comm_ST_Psi;
	2743	MPI_Recv( x_l, LevS->MaxG*ElementSize, MPI_DOUBLE, RecvSource, HamiltonianTag, P->Par.comm_ST_PsiT, &status );
	2744	} else { // .. otherwise setup wave function as x ...
	2745	// Evaluate cross product: \epsilon_{ijm} (d_k - d_l)_j p_m \| \varphi^{(0)} \rangle = b_i ... and
	2746	LPsiDatB=LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo];
	2747	//LPsiDatx=LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo+Psi->TypeStartIndex[Perturbed_P0]];
	2748	//CalculatePerturbationOperator_P(P,LPsiDatB,LPsiDatB_p0,cross(in,1),0);
	2749	//CalculatePerturbationOperator_P(P,LPsiDatB,LPsiDatB_p1,cross(in,3),0);
	2750	for (dex=0;dex<4;dex++)
	2751	cross_lookup[dex] = cross(in,dex);
	2752	for(s=0;s<LevS->MaxG;s++) {
	2753	//if (x_l != x_l_bak \|\| s<0 \|\| s>LevS->MaxG) Error(SomeError,"FillDeltaCurrentDensity: x_l[] corrupted");
	2754	factor =
	2755	(MinImageConv(Lat,Psi->AddData[LOnePsiA->MyLocalNo].WannierCentre[cross_lookup[0]],
	2756	Psi->AddData[LOnePsiB->MyLocalNo].WannierCentre[cross_lookup[0]],cross_lookup[0]) * LevS->GArray[s].G[cross_lookup[1]] -
	2757	MinImageConv(Lat,Psi->AddData[LOnePsiA->MyLocalNo].WannierCentre[cross_lookup[2]],
	2758	Psi->AddData[LOnePsiB->MyLocalNo].WannierCentre[cross_lookup[2]],cross_lookup[2]) * LevS->GArray[s].G[cross_lookup[3]]);
	2759	x_l[s].re = factor * (-LPsiDatB[s].im); // switched due to factorization with "-i G"
	2760	x_l[s].im = factor * (LPsiDatB[s].re);
	2761	}
	2762	// ... and send it to all other processes (Max_me... - 1)
	2763	for (u=0;u<P->Par.Max_me_comm_ST_PsiT;u++)
	2764	if (u != OnePsiB->my_color_comm_ST_Psi)
	2765	MPI_Send( x_l, LevS->MaxG*ElementSize, MPI_DOUBLE, u, HamiltonianTag, P->Par.comm_ST_PsiT);
	2766	} // x_l row is now filled (either by receiving result or evaluating it on its own)
	2767	// Solve Ax = b by minimizing 1/2 xAx -xb (gradient is residual Ax - b) with conjugate gradient polak-ribiere
	2768
	2769	debug(P,"fill starting point x with values from b");
	2770	/* Starting point, x = b */
	2771	for (u=0;u<LevS->MaxG;u++) {
	2772	gsl_vector_set (x, 2*u, x_l[u].re);
	2773	gsl_vector_set (x, 2*u+1, x_l[u].im);
	2774	}
	2775
	2776	gsl_multimin_fdfminimizer_set (minset, &my_func, x, 0.01, 1e-4);
	2777
	2778	fprintf(stderr,"(%i) Start solving for (%i,%i) and index %i\n",P->Par.me, k,l,in);
	2779	// start solving
	2780	iter = 0;
	2781	do
	2782	{
	2783	iter++;
	2784	Status = gsl_multimin_fdfminimizer_iterate (minset);
	2785
	2786	if (Status)
	2787	break;
	2788
	2789	Status = gsl_multimin_test_gradient (minset->gradient, 1e-3);
	2790
	2791	if (Status == GSL_SUCCESS)
	2792	fprintf (stderr,"(%i) Minimum found after %i iterations.\n", P->Par.me, iter);
	2793
	2794	} while (Status == GSL_CONTINUE && iter < 100);
	2795
	2796	debug(P,"Put solution into Psi1");
	2797	// ... and what do we do now? Put solution into Psi1!
	2798	for(s=0;s<LevS->MaxG;s++) {
	2799	//if (Psi1 != (fftw_complex *) Dens0->DensityCArray[Temp2Density] \|\| s<0 \|\| s>LevS->MaxG) Error(SomeError,"FillDeltaCurrentDensity: Psi1 corrupted");
	2800	Psi1[s].re = gsl_vector_get (minset->x, 2*s);
	2801	Psi1[s].im = gsl_vector_get (minset->x, 2*s+1);
	2802	}
	2803
	2804	// // Solve A^{-1} b_i = x
	2805	// for(s=0;s<LevS->MaxG;s++) {
	2806	// // REAL PART
	2807	// // retrieve column from gathered matrix
	2808	// for(u=0;u<Num;u++)
	2809	// gsl_vector_set(x,u,x_l[u][s].re);
	2810	//
	2811	// // solve: sum_l A_{kl}^(-1) b_l (s) = x_k (s)
	2812	// gsl_linalg_LU_svx (G, p, x);
	2813	//
	2814	// // put solution back into x_l[s]
	2815	// for(u=0;u<Num;u++) {
	2816	// //if (x_l != x_l_bak \|\| s<0 \|\| s>=LevS->MaxG) Error(SomeError,"FillDeltaCurrentDensity: x_l[] corrupted");
	2817	// x_l[u][s].re = gsl_vector_get(x,u);
	2818	// }
	2819	//
	2820	// // IMAGINARY PART
	2821	// // retrieve column from gathered matrix
	2822	// for(u=0;u<Num;u++)
	2823	// gsl_vector_set(x,u,x_l[u][s].im);
	2824	//
	2825	// // solve: sum_l A_{kl}^(-1) b_l (s) = x_k (s)
	2826	// gsl_linalg_LU_svx (G, p, x);
	2827	//
	2828	// // put solution back into x_l[s]
	2829	// for(u=0;u<Num;u++) {
	2830	// //if (x_l != x_l_bak \|\| s<0 \|\| s>=LevS->MaxG) Error(SomeError,"FillDeltaCurrentDensity: x_l[] corrupted");
	2831	// x_l[u][s].im = gsl_vector_get(x,u);
	2832	// }
	2833	// } // now we have in x_l a vector similar to "Psi1" which we use to evaluate the current density
	2834	//
	2835	// // evaluate \Delta J_k ... mind the minus sign from G_kl!
	2836	// // fill Psi1
	2837	// for(s=0;s<LevS->MaxG;s++) {
	2838	// //if (Psi1 != (fftw_complex *) Dens0->DensityCArray[Temp2Density] \|\| s<0 \|\| s>LevS->MaxG) Error(SomeError,"FillDeltaCurrentDensity: Psi1 corrupted");
	2839	// Psi1[s].re = x_l[k][s].re;
	2840	// Psi1[s].im = x_l[k][s].im;
	2841	// }
	2842
	2843	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Bringing \|Psi1> one level up and fftransforming\n", P->Par.me);
	2844	//if (Psi1R != (fftw_real *)Dens0->DensityArray[GapUpDensity]) Error(SomeError,"FillDeltaCurrentDensity: Psi1R corrupted");
	2845	fft_Psi(P,Psi1,Psi1R, 0, Psi1symmetry); //2 // 0 //0
	2846
	2847	for (index=0;index<NDIM;index++) { // for all NDIM components of momentum operator
	2848
	2849	if ((P->Call.out[StepLeaderOut]) && (!index)) fprintf(stderr,"(%i) Bringing p\|Psi0> one level up and fftransforming\n", P->Par.me);
	2850	//if (Psip0R != (fftw_real *)Dens0->DensityArray[GapLocalDensity]) Error(SomeError,"FillDeltaCurrentDensity: Psip0R corrupted");
	2851	fft_Psi(P,Psi0,Psip0R, index, Psip0symmetry); //6 //6 //6
	2852
	2853	if ((P->Call.out[StepLeaderOut]) && (!index)) fprintf(stderr,"(%i) Bringing p\|Psi1> one level up and fftransforming\n", P->Par.me);
	2854	//if (Psip1R != (fftw_real *)Dens0->DensityArray[GapDownDensity]) Error(SomeError,"FillDeltaCurrentDensity: Psip1R corrupted");
	2855	fft_Psi(P,Psi1,Psip1R, index, Psip1symmetry); //4 //6 //6
	2856
	2857	// then for every point on the grid in real space ...
	2858	for (n0=0;n0<N0;n0++) // only local points on x axis
	2859	for (n[1]=0;n[1]<N[1];n[1]++)
	2860	for (n[2]=0;n[2]<N[2];n[2]++) {
	2861	i0 = n[2]+N[2](n[1]+N[1]n0);
	2862	// and take the product
	2863	Current = (Psip0R[i0] * Psi1R[i0] + Psi0R[i0] * Psip1R[i0]);
	2864	Current = 0.5 UnitsFactor * Psi->AllPsiStatus[OnePsiA->MyGlobalNo].PsiFactor * R->FactorDensityR;
	2865	////if (CurrentDensity[index+inNDIM] != (fftw_real ) Dens0->DensityArray[CurrentDensity0 + index+in*NDIM]) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
	2866	//if (i0<0 \|\| i0>=Dens0->LocalSizeR) Error(SomeError,"FillDeltaCurrentDensity: i0 out of range");
	2867	//if ((index+inNDIM)<0 \|\| (index+inNDIM)>=NDIM*NDIM) Error(SomeError,"FillDeltaCurrentDensity: index out of range");
	2868	CurrentDensity[index+in*NDIM][i0] += Current; // minus sign is from G_kl
	2869	}
	2870	}
	2871	}
	2872	}
	2873	}
	2874	}
	2875	}
	2876	}
	2877	}
	2878	UnLockDensityArray(Dens0,GapDensity,real); // Psi0R
	2879	UnLockDensityArray(Dens0,GapLocalDensity,real); // Psip0R
	2880	UnLockDensityArray(Dens0,Temp2Density,imag); // Psi1
	2881	UnLockDensityArray(Dens0,GapUpDensity,real); // Psi1R
	2882	UnLockDensityArray(Dens0,GapDownDensity,real); // Psip1R
	2883	// for (i=0;i<Num;i++)
[64fa9e]	2884	// if (x_l[i] != NULL) Free(x_l[i], "bla", "bla");
	2885	// Free(x_l, "bla");
[a0bcf1]	2886	gsl_multimin_fdfminimizer_free (minset);
	2887	gsl_vector_free (x);
	2888	// gsl_matrix_free(G);
	2889	// gsl_permutation_free(p);
	2890	// gsl_vector_free(x);
	2891	}
	2892
	2893
	2894	/** Evaluates the overlap integral between \a state wave functions.
	2895	* \f[
	2896	* S_{kl} = \langle \varphi_k^{(1)} \| \varphi_l^{(1)} \rangle
	2897	* \f]
	2898	* The scalar product is calculated via GradSP(), MPI_Allreduced among comm_ST_Psi and the result
	2899	* stored in Psis#Overlap. The rows have to be MPI exchanged, as otherwise processes will add
	2900	* to the TotalEnergy overlaps calculated with old wave functions - they have been minimised after
	2901	* the product with exchanged coefficients was taken.
	2902	* \param *P Problem at hand
	2903	* \param l local number of perturbed wave function.
	2904	* \param state PsiTypeTag minimisation state of wave functions to be overlapped
	2905	*/
	2906	void CalculateOverlap(struct Problem *P, const int l, const enum PsiTypeTag state)
	2907	{
	2908	struct RunStruct *R = &P->R;
	2909	struct Lattice *Lat = &(P->Lat);
	2910	struct Psis *Psi = &Lat->Psi;
	2911	struct LatticeLevel *LevS = R->LevS;
	2912	struct OnePsiElement OnePsiB, LOnePsiB;
	2913	fftw_complex LPsiDatB=NULL, LPsiDatA=NULL;
	2914	const int ElementSize = (sizeof(fftw_complex) / sizeof(double));
	2915	int RecvSource;
	2916	MPI_Status status;
	2917	int i,j,m,p;
	2918	//const int l_normal = l - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[Occupied];
	2919	const int ActNum = l - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[1] * Psi->LocalPsiStatus[l].my_color_comm_ST_Psi;
	2920	double sendbuf, recvbuf;
	2921	double tmp,TMP;
	2922	const int gsize = P->Par.Max_me_comm_ST_PsiT; //number of processes in PsiT
	2923	int p_num; // number of wave functions (for overlap)
	2924
	2925	// update overlap table after wave function has changed
	2926	LPsiDatA = LevS->LPsi->LocalPsi[l];
	2927	m = -1; // to access U matrix element (0..Num-1)
	2928	for (j=0; j < Psi->MaxPsiOfType+P->Par.Max_me_comm_ST_PsiT; j++) { // go through all wave functions
	2929	OnePsiB = &Psi->AllPsiStatus[j]; // grab OnePsiB
	2930	if (OnePsiB->PsiType == state) { // drop all but the ones of current min state
	2931	m++; // increase m if it is non-extra wave function
	2932	if (OnePsiB->my_color_comm_ST_Psi == P->Par.my_color_comm_ST_Psi) // local?
	2933	LOnePsiB = &Psi->LocalPsiStatus[OnePsiB->MyLocalNo];
	2934	else
	2935	LOnePsiB = NULL;
	2936	if (LOnePsiB == NULL) { // if it's not local ... receive it from respective process into TempPsi
	2937	RecvSource = OnePsiB->my_color_comm_ST_Psi;
	2938	MPI_Recv( LevS->LPsi->TempPsi, LevS->MaxG*ElementSize, MPI_DOUBLE, RecvSource, OverlapTag, P->Par.comm_ST_PsiT, &status );
	2939	LPsiDatB=LevS->LPsi->TempPsi;
	2940	} else { // .. otherwise send it to all other processes (Max_me... - 1)
	2941	for (p=0;p<P->Par.Max_me_comm_ST_PsiT;p++)
	2942	if (p != OnePsiB->my_color_comm_ST_Psi)
	2943	MPI_Send( LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo], LevS->MaxG*ElementSize, MPI_DOUBLE, p, OverlapTag, P->Par.comm_ST_PsiT);
	2944	LPsiDatB=LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo];
	2945	} // LPsiDatB is now set to the coefficients of OnePsi either stored or MPI_Received
	2946
	2947	tmp = GradSP(P, LevS, LPsiDatA, LPsiDatB) * sqrt(Psi->LocalPsiStatus[l].PsiFactor * OnePsiB->PsiFactor);
	2948	MPI_Allreduce ( &tmp, &TMP, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
	2949	//fprintf(stderr,"(%i) Setting Overlap [%i][%i] = %lg\n",P->Par.me, ActNum,m,TMP);
	2950	Psi->Overlap[ActNum][m] = TMP; //= Psi->Overlap[m][ActNum]
	2951	}
	2952	}
	2953
	2954	// exchange newly calculated rows among PsiT
	2955	p_num = (m+1) + 1; // number of Psis: one more due to ActNum
	2956	sendbuf = (double ) Malloc(p_num sizeof(double), "CalculateOverlap: sendbuf");
	2957	sendbuf[0] = ActNum; // first entry is the global row number
	2958	for (i=1;i<p_num;i++)
	2959	sendbuf[i] = Psi->Overlap[ActNum][i-1]; // then follow up each entry of overlap row
	2960	recvbuf = (double ) Malloc(gsize p_num * sizeof(double), "CalculateOverlap: recvbuf");
	2961	MPI_Allgather(sendbuf, p_num, MPI_DOUBLE, recvbuf, p_num, MPI_DOUBLE, P->Par.comm_ST_PsiT);
[64fa9e]	2962	Free(sendbuf, "bla");
[a0bcf1]	2963	for (i=0;i<gsize;i++) {// extract results from other processes out of receiving buffer
	2964	m = recvbuf[i*p_num]; // m is ActNum of the process whose results we've just received
	2965	//fprintf(stderr,"(%i) Received row %i from process %i\n", P->Par.me, m, i);
	2966	for (j=1;j<p_num;j++)
	2967	Psi->Overlap[m][j-1] = Psi->Overlap[j-1][m] = recvbuf[i*p_num+j]; // put each entry into correspondent Overlap row
	2968	}
[64fa9e]	2969	Free(recvbuf, "bla");
[a0bcf1]	2970	}
	2971
	2972
	2973	/** Calculates magnetic susceptibility from known current density.
	2974	* The bulk susceptibility tensor can be expressed as a function of the current density.
	2975	* \f[
	2976	* \chi_{ij} = \frac{\mu_0}{2\Omega} \frac{\delta}{\delta B_i^{ext}} \int_\Omega d^3 r \left (r \times j(r) \right )_j
	2977	* \f]
	2978	* Thus the integral over real space and subsequent MPI_Allreduce() over results from ParallelSimulationData#comm_ST_Psi is
	2979	* straightforward. Tensor is diagonalized afterwards and split into its various sub-tensors of lower rank (e.g., isometric
	2980	* value is tensor of rank 0) which are printed to screen and the tensorial elements to file '....chi.csv'
	2981	* \param *P Problem at hand
	2982	*/
	2983	void CalculateMagneticSusceptibility(struct Problem *P)
	2984	{
	2985	struct RunStruct *R = &P->R;
	2986	struct Lattice *Lat = &P->Lat;
	2987	struct LatticeLevel *Lev0 = R->Lev0;
	2988	struct Density *Dens0 = R->Lev0->Dens;
	2989	struct Ions *I = &P->Ion;
	2990	fftw_real CurrentDensity[NDIMNDIM];
	2991	int in, dex, i, i0, n0;
	2992	int n[NDIM];
	2993	const int N0 = Lev0->Plan0.plan->local_nx;
	2994	int N[NDIM];
	2995	N[0] = Lev0->Plan0.plan->N[0];
	2996	N[1] = Lev0->Plan0.plan->N[1];
	2997	N[2] = Lev0->Plan0.plan->N[2];
	2998	double chi[NDIMNDIM],Chi[NDIMNDIM], x[NDIM], fac[NDIM];
	2999	const double discrete_factor = Lat->Volume/Lev0->MaxN;
	3000	const int myPE = P->Par.me_comm_ST_Psi;
	3001	double eta, delta_chi, S, A, iso;
	3002	int cross_lookup[4];
	3003	char filename[256];
	3004	FILE *ChiFile;
	3005	time_t seconds;
	3006	time(&seconds); // get current time
	3007
	3008	// set pointers onto current density
	3009	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
	3010	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
	3011	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
	3012	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
	3013	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
	3014	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
	3015	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
	3016	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
	3017	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
	3018	//for(i=0;i<NDIM;i++) {
	3019	// field[i] = Dens0->DensityArray[TempDensity+i];
	3020	//LockDensityArray(Dens0,TempDensity+i,real);
	3021	// SetArrayToDouble0((double )field[i],Dens0->TotalSize2);
	3022	//}
	3023	gsl_matrix_complex *H = gsl_matrix_complex_calloc(NDIM,NDIM);
	3024
	3025
	3026	if (P->Call.out[ValueOut]) fprintf(stderr,"(%i) magnetic susceptibility tensor \\Chi_ij = \n",P->Par.me);
	3027	for (in=0; in<NDIM; in++) { // index i of integrand vector component
	3028	for(dex=0;dex<4;dex++) // initialise cross lookup
	3029	cross_lookup[dex] = cross(in,dex);
	3030	for (dex=0; dex<NDIM; dex++) { // index j of derivation wrt B field
	3031	chi[in+dex*NDIM] = 0.;
	3032	// do the integration over real space
	3033	for(n0=0;n0<N0;n0++)
	3034	for(n[1]=0;n[1]<N[1];n[1]++)
	3035	for(n[2]=0;n[2]<N[2];n[2]++) {
	3036	n[0]=n0 + N0*myPE; // global relative coordinate: due to partitoning of x-axis in PEPGamma>1 case
	3037	fac[0] = (double)(n[0])/(double)N[0];
	3038	fac[1] = (double)(n[1])/(double)N[1];
	3039	fac[2] = (double)(n[2])/(double)N[2];
	3040	RMat33Vec3(x, Lat->RealBasis, fac);
	3041	i0 = n[2]+N[2](n[1]+N[1](n0)); // the index of current density must match LocalSizeR!
[f5586e]	3042	chi[in+dexNDIM] += MinImageConv(Lat,x[cross_lookup[0]], sqrt(Lat->RealBasisSQ[cross_lookup[0]])/2.,cross_lookup[0]) CurrentDensity[dex*NDIM+cross_lookup[1]][i0]; // x[cross(in,0)], sqrt(Lat->RealBasisSQ[cross_lookup[0]])/2.
	3043	chi[in+dexNDIM] -= MinImageConv(Lat,x[cross_lookup[2]], sqrt(Lat->RealBasisSQ[cross_lookup[2]])/2.,cross_lookup[2]) CurrentDensity[dex*NDIM+cross_lookup[3]][i0]; // x[cross(in,2)], sqrt(Lat->RealBasisSQ[cross_lookup[2]])/2.
[a0bcf1]	3044	// if (in == dex) field[in][i0] =
[f5586e]	3045	// truedist(Lat,x[cross_lookup[0]], sqrt(Lat->RealBasisSQ[c[0]])/2.,cross_lookup[0]) * CurrentDensity[dex*NDIM+cross_lookup[1]][i0]
	3046	// - truedist(Lat,x[cross_lookup[2]], sqrt(Lat->RealBasisSQ[c[2]])/2.,cross_lookup[2]) * CurrentDensity[dex*NDIM+cross_lookup[3]][i0];
	3047	//fprintf(stderr,"(%i) temporary susceptiblity \\chi[%i][%i] += %e * %e = r[%i] * CurrDens[%i][%i] = %e\n",P->Par.me,in,dex,(double)n[cross_lookup[0]]/(double)N[cross_lookup[0]](sqrt(Lat->RealBasisSQ[cross_lookup[0]])),CurrentDensity[dexNDIM+cross_lookup[1]][i0],cross_lookup[0],dexNDIM+cross_lookup[1],i0,chi[inNDIM+dex]);
[a0bcf1]	3048	}
	3049	chi[in+dexNDIM] = mu0discrete_factor/(2.Lat->Volume); // integral factor
	3050	chi[in+dexNDIM] = (-1625.); // empirical gauge factor ... sigh
	3051	MPI_Allreduce ( &chi[in+dexNDIM], &Chi[in+dexNDIM], 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum "LocalSize to TotalSize"
	3052	I->I[0].chi[in+dexNDIM] = Chi[in+dexNDIM];
	3053	Chi[in+dexNDIM] = Lat->Volume*loschmidt_constant; // factor for _molar_ susceptibility
	3054	if (P->Call.out[ValueOut]) {
	3055	fprintf(stderr,"%e\t", Chi[in+dex*NDIM]);
	3056	if (dex == NDIM-1) fprintf(stderr,"\n");
	3057	}
	3058	}
	3059	}
	3060	// store symmetrized matrix
	3061	for (in=0;in<NDIM;in++)
	3062	for (dex=0;dex<NDIM;dex++)
	3063	gsl_matrix_complex_set(H,in,dex,gsl_complex_rect((Chi[in+dexNDIM]+Chi[dex+inNDIM])/2.,0));
	3064	// output tensor to file
	3065	if (P->Par.me == 0) {
	3066	sprintf(filename, ".chi.L%i.csv", Lev0->LevelNo);
	3067	OpenFile(P, &ChiFile, filename, "a", P->Call.out[ReadOut]);
	3068	fprintf(ChiFile,"# magnetic susceptibility tensor chi[01,02,03,10,11,12,20,21,22], seed %i, config %s, run on %s", R->Seed, P->Files.default_path, ctime(&seconds));
	3069	fprintf(ChiFile,"%lg\t", P->Lat.ECut/(Lat->LevelSizes[0]*Lat->LevelSizes[0]));
	3070	for (in=0;in<NDIM*NDIM;in++)
	3071	fprintf(ChiFile,"%e\t", Chi[in]);
	3072	fprintf(ChiFile,"\n");
	3073	fclose(ChiFile);
	3074	}
	3075	// diagonalize chi
	3076	gsl_vector *eval = gsl_vector_alloc(NDIM);
	3077	gsl_eigen_herm_workspace *w = gsl_eigen_herm_alloc(NDIM);
	3078	gsl_eigen_herm(H, eval, w);
	3079	gsl_eigen_herm_free(w);
	3080	gsl_sort_vector(eval); // sort eigenvalues
	3081	// print eigenvalues
	3082	iso = 0;
	3083	for (i=0;i<NDIM;i++) {
	3084	I->I[0].chi_PAS[i] = gsl_vector_get(eval,i);
	3085	iso += Chi[i+i*NDIM]/3.;
	3086	}
	3087	eta = (gsl_vector_get(eval,1)-gsl_vector_get(eval,0))/(gsl_vector_get(eval,2)-iso);
	3088	delta_chi = gsl_vector_get(eval,2) - 0.5*(gsl_vector_get(eval,0)+gsl_vector_get(eval,1));
	3089	S = (delta_chidelta_chi)(1+1./3.etaeta);
	3090	A = 0.;
	3091	for (i=0;i<NDIM;i++) {
	3092	in = cross(i,0);
	3093	dex = cross(i,1);
	3094	A += pow(-1,i)pow(0.5(Chi[in+dexNDIM]-Chi[dex+inNDIM]),2);
	3095	}
	3096	if (P->Call.out[ValueOut]) {
	3097	fprintf(stderr,"(%i) converted to Principal Axis System\n==================\nDiagonal entries:", P->Par.me);
	3098	for (i=0;i<NDIM;i++)
	3099	fprintf(stderr,"\t%lg",gsl_vector_get(eval,i));
	3100	fprintf(stderr,"\nsusceptib. : %e\n", iso);
	3101	fprintf(stderr,"anisotropy : %e\n", delta_chi);
	3102	fprintf(stderr,"asymmetry : %e\n", eta);
	3103	fprintf(stderr,"S : %e\n", S);
	3104	fprintf(stderr,"A : %e\n", A);
	3105	fprintf(stderr,"==================\n");
	3106	}
	3107	//for(i=0;i<NDIM;i++)
	3108	//UnLockDensityArray(Dens0,TempDensity+i,real);
	3109	gsl_vector_free(eval);
	3110	gsl_matrix_complex_free(H);
	3111	}
	3112
	3113	/** Fouriertransforms all nine current density components and calculates shielding tensor.
	3114	* \f[
	3115	* \sigma_{ij} = \left ( \frac{G}{\|G\|^2} \times J_i(G) \right )_j
	3116	* \f]
	3117	* The CurrentDensity has to be fouriertransformed to reciprocal subspace in order to be useful, and the final
	3118	* product \f$\sigma_{ij}(G)\f$ has to be back-transformed to real space. However, the shielding is the only evaluated
	3119	* at the grid points and not where the real ion position is. The shieldings there are interpolated between the eight
	3120	* adjacent grid points by a simple linear weighting. Afterwards follows the same analaysis and printout of the rank-2-tensor
	3121	* as in the case of CalculateMagneticShielding().
	3122	* \param *P Problem at hand
	3123	* \note Lots of arrays are used temporarily during the routine for the fft'ed Current density tensor.
	3124	* \note MagneticSusceptibility is needed for G=0-component and thus has to be computed beforehand
	3125	*/
	3126	void CalculateChemicalShieldingByReciprocalCurrentDensity(struct Problem *P)
	3127	{
	3128	struct RunStruct *R = &P->R;
	3129	struct Lattice *Lat = &P->Lat;
	3130	struct LatticeLevel *Lev0 = R->Lev0;
	3131	struct Ions *I = &P->Ion;
	3132	struct Density *Dens0 = Lev0->Dens;
	3133	struct OneGData *GArray = Lev0->GArray;
	3134	struct fft_plan_3d *plan = Lat->plan;
	3135	fftw_real CurrentDensity[NDIMNDIM];
	3136	fftw_complex CurrentDensityC[NDIMNDIM];
	3137	fftw_complex work = (fftw_complex )Dens0->DensityCArray[TempDensity];
	3138	//fftw_complex sigma_imag = (fftw_complex )Dens0->DensityCArray[Temp2Density];
	3139	//fftw_real sigma_real = (fftw_real )sigma_imag;
	3140	fftw_complex *sigma_imag[NDIM_NDIM];
	3141	fftw_real *sigma_real[NDIM_NDIM];
	3142	double sigma,Sigma;
	3143	int it, ion, in, dex, g, n[2][NDIM], Index, i;
	3144	//const double FFTfactor = 1.;///Lev0->MaxN;
	3145	double eta, delta_sigma, S, A, iso, tmp;
	3146	FILE *SigmaFile;
	3147	char suffixsigma[255];
	3148	double x[2][NDIM];
	3149	const int myPE = P->Par.me_comm_ST_Psi;
	3150	int N[NDIM];
	3151	int cross_lookup[4]; // cross lookup table
	3152	N[0] = Lev0->Plan0.plan->N[0];
	3153	N[1] = Lev0->Plan0.plan->N[1];
	3154	N[2] = Lev0->Plan0.plan->N[2];
	3155	const int N0 = Lev0->Plan0.plan->local_nx;
	3156	const double factorDC = R->FactorDensityC;
	3157	gsl_matrix_complex *H = gsl_matrix_complex_calloc(NDIM,NDIM);
	3158
	3159	time_t seconds;
	3160	time(&seconds); // get current time
	3161
	3162	// inverse Fourier transform current densities
	3163	CurrentDensityC[0] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity0];
	3164	CurrentDensityC[1] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity1];
	3165	CurrentDensityC[2] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity2];
	3166	CurrentDensityC[3] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity3];
	3167	CurrentDensityC[4] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity4];
	3168	CurrentDensityC[5] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity5];
	3169	CurrentDensityC[6] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity6];
	3170	CurrentDensityC[7] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity7];
	3171	CurrentDensityC[8] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity8];
	3172	// don't put the following stuff into a for loop, they are not continuous! (preprocessor values CurrentDensity.)
	3173	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
	3174	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
	3175	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
	3176	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
	3177	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
	3178	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
	3179	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
	3180	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
	3181	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
	3182
	3183	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Checking J_{ij} (G=0) = 0 for each i,j ... \n",P->Par.me);
	3184	for (in=0;in<NDIM*NDIM;in++) {
	3185	CalculateOneDensityC(Lat, R->LevS, Dens0, CurrentDensity[in], CurrentDensityC[in], factorDC);
	3186	tmp = sqrt(CurrentDensityC[in][0].reCurrentDensityC[in][0].re+CurrentDensityC[in][0].imCurrentDensityC[in][0].im);
	3187	if (GArray[0].GSq < MYEPSILON) {
	3188	if (in % NDIM == 0) fprintf(stderr,"(%i) ",P->Par.me);
	3189	if (tmp > MYEPSILON) {
	3190	fprintf(stderr,"J_{%i,%i} = \|%e + i%e\| < %e ? (%e)\t", in / NDIM, in%NDIM, CurrentDensityC[in][0].re, CurrentDensityC[in][0].im, MYEPSILON, tmp - MYEPSILON);
	3191	} else {
	3192	fprintf(stderr,"J_{%i,%i} ok\t", in / NDIM, in%NDIM);
	3193	}
	3194	if (in % NDIM == (NDIM-1)) fprintf(stderr,"\n");
	3195	}
	3196	}
	3197
	3198	for (in=0;in<NDIM*NDIM;in++) {
	3199	LockDensityArray(Dens0,in,real); // Psi1R
	3200	sigma_imag[in] = (fftw_complex *) Dens0->DensityArray[in];
	3201	sigma_real[in] = (fftw_real *) sigma_imag[in];
	3202	}
	3203
	3204	LockDensityArray(Dens0,TempDensity,imag); // work
	3205	LockDensityArray(Dens0,Temp2Density,imag); // tempdestRC and field
	3206	// go through reciprocal nodes and calculate shielding tensor sigma
	3207	for (in=0; in<NDIM; in++) {// index i of vector component in integrand
	3208	for(dex=0;dex<4;dex++) // initialise cross lookup
	3209	cross_lookup[dex] = cross(in,dex);
	3210	for (dex=0; dex<NDIM; dex++) { // index j of B component derivation in current density tensor
	3211	//if (tempdestRC != (fftw_complex *)Dens0->DensityCArray[Temp2Density]) Error(SomeError,"CalculateChemicalShieldingByReciprocalCurrentDensity: tempdestRC corrupted");
	3212	SetArrayToDouble0((double )sigma_imag[in+dexNDIM],Dens0->TotalSize*2);
	3213	for (g=0; g < Lev0->MaxG; g++)
	3214	if (GArray[g].GSq > MYEPSILON) { // skip due to divisor
	3215	Index = GArray[g].Index; // re = im, im = -re due to "i" in formula
	3216	//if (tempdestRC != (fftw_complex *)Dens0->DensityCArray[Temp2Density] \|\| Index<0 \|\| Index>=Dens0->LocalSizeC) Error(SomeError,"CalculateChemicalShieldingByReciprocalCurrentDensity: tempdestRC corrupted");
	3217	sigma_imag[in+dexNDIM][Index].re = GArray[g].G[cross_lookup[0]] (-CurrentDensityC[dexNDIM+cross_lookup[1]][Index].im)/GArray[g].GSq;//FFTfactor;
	3218	sigma_imag[in+dexNDIM][Index].re -= GArray[g].G[cross_lookup[2]] (-CurrentDensityC[dexNDIM+cross_lookup[3]][Index].im)/GArray[g].GSq;//FFTfactor;
	3219	sigma_imag[in+dexNDIM][Index].im = GArray[g].G[cross_lookup[0]] ( CurrentDensityC[dexNDIM+cross_lookup[1]][Index].re)/GArray[g].GSq;//FFTfactor;
	3220	sigma_imag[in+dexNDIM][Index].im -= GArray[g].G[cross_lookup[2]] ( CurrentDensityC[dexNDIM+cross_lookup[3]][Index].re)/GArray[g].GSq;//FFTfactor;
	3221	} else { // G=0-component stems from magnetic susceptibility
	3222	sigma_imag[in+dexNDIM][GArray[g].Index].re = 2./3.I->I[0].chi[in+dexNDIM];//-4.M_PI(0.5I->I[0].chi[0+0NDIM]+0.5I->I[0].chi[1+1NDIM]+2./3.I->I[0].chi[2+2*NDIM]);
	3223	}
	3224	for (g=0; g<Lev0->MaxDoubleG; g++) { // apply symmetry
	3225	//if (tempdestRC != (fftw_complex )Dens0->DensityCArray[Temp2Density] \|\| Lev0->DoubleG[2g+1]<0 \|\| Lev0->DoubleG[2*g+1]>=Dens0->LocalSizeC) Error(SomeError,"CalculateChemicalShieldingByReciprocalCurrentDensity: tempdestRC corrupted");
	3226	sigma_imag[in+dexNDIM][Lev0->DoubleG[2g+1]].re = sigma_imag[in+dexNDIM][Lev0->DoubleG[2g]].re;
	3227	sigma_imag[in+dexNDIM][Lev0->DoubleG[2g+1]].im = -sigma_imag[in+dexNDIM][Lev0->DoubleG[2g]].im;
	3228	}
	3229	// fourier transformation of sigma
	3230	//if (tempdestRC != (fftw_complex *)Dens0->DensityCArray[Temp2Density]) Error(SomeError,"CalculateChemicalShieldingByReciprocalCurrentDensity: tempdestRC corrupted");
	3231	fft_3d_complex_to_real(plan, Lev0->LevelNo, FFTNF1, sigma_imag[in+dex*NDIM], work);
	3232
	3233	for (it=0; it < I->Max_Types; it++) { // integration over all types
	3234	for (ion=0; ion < I->I[it].Max_IonsOfType; ion++) { // and each ion of type
	3235	// read transformed sigma at core position and MPI_Allreduce
	3236	for (g=0;g<NDIM;g++) {
[f5586e]	3237	n[0][g] = floor(I->I[it].R[NDIMion+g]/sqrt(Lat->RealBasisSQ[g])(double)N[g]);
	3238	n[1][g] = ceil(I->I[it].R[NDIMion+g]/sqrt(Lat->RealBasisSQ[g])(double)N[g]);
	3239	x[1][g] = I->I[it].R[NDIMion+g]/sqrt(Lat->RealBasisSQ[g])(double)N[g] - (double)n[0][g];
[a0bcf1]	3240	x[0][g] = 1. - x[1][g];
	3241	//fprintf(stderr,"(%i) n_floor[%i] = %i\tn_ceil[%i] = %i --- x_floor[%i] = %e\tx_ceil[%i] = %e\n",P->Par.me, g,n[0][g], g,n[1][g], g,x[0][g], g,x[1][g]);
	3242	}
	3243	sigma = 0.;
	3244	for (i=0;i<2;i++) { // interpolate linearly between adjacent grid points per axis
	3245	if ((n[i][0] >= N0myPE) && (n[i][0] < N0(myPE+1))) {
	3246	// fprintf(stderr,"(%i) field[%i]: sigma = %e\n", P->Par.me, n[i][2]+N[2](n[i][1]+N[1](n[i][0]-N0*myPE)), sigma);
	3247	sigma += (x[i][0]x[0][1]x[0][2])sigma_real[in+dexNDIM][n[0][2]+N[2](n[0][1]+N[1](n[i][0]-N0myPE))]mu0; // if it's local and factor from inverse fft
	3248	//fprintf(stderr,"(%i) field[%i]: sigma += %e * %e \n", P->Par.me, n[i][2]+N[2](n[i][1]+N[1](n[i][0]-N0myPE)), (x[i][0]x[0][1]x[0][2]), field[n[0][2]+N[2](n[0][1]+N[1](n[i][0]-N0myPE))]*mu0);
	3249	sigma += (x[i][0]x[0][1]x[1][2])sigma_real[in+dexNDIM][n[1][2]+N[2](n[0][1]+N[1](n[i][0]-N0myPE))]mu0; // if it's local and factor from inverse fft
	3250	//fprintf(stderr,"(%i) field[%i]: sigma += %e * %e \n", P->Par.me, n[i][2]+N[2](n[i][1]+N[1](n[i][0]-N0myPE)), (x[i][0]x[0][1]x[1][2]), field[n[1][2]+N[2](n[0][1]+N[1](n[i][0]-N0myPE))]*mu0);
	3251	sigma += (x[i][0]x[1][1]x[0][2])sigma_real[in+dexNDIM][n[0][2]+N[2](n[1][1]+N[1](n[i][0]-N0myPE))]mu0; // if it's local and factor from inverse fft
	3252	//fprintf(stderr,"(%i) field[%i]: sigma += %e * %e \n", P->Par.me, n[i][2]+N[2](n[i][1]+N[1](n[i][0]-N0myPE)), (x[i][0]x[1][1]x[0][2]), field[n[0][2]+N[2](n[1][1]+N[1](n[i][0]-N0myPE))]*mu0);
	3253	sigma += (x[i][0]x[1][1]x[1][2])sigma_real[in+dexNDIM][n[1][2]+N[2](n[1][1]+N[1](n[i][0]-N0myPE))]mu0; // if it's local and factor from inverse fft
	3254	//fprintf(stderr,"(%i) field[%i]: sigma += %e * %e \n", P->Par.me, n[i][2]+N[2](n[i][1]+N[1](n[i][0]-N0myPE)), (x[i][0]x[1][1]x[1][2]), field[n[1][2]+N[2](n[1][1]+N[1](n[i][0]-N0myPE))]*mu0);
	3255	}
	3256	}
	3257	sigma *= -R->FactorDensityR; // factor from inverse fft? (and its defined as negative proportionaly factor)
	3258	MPI_Allreduce ( &sigma, &Sigma, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum local to total
	3259	I->I[it].sigma_rezi[ion][in+dex*NDIM] = Sigma;
	3260	}
	3261	}
	3262	// fabs() all sigma values, as we need them as a positive density: OutputVis plots them in logarithmic scale and
	3263	// thus cannot deal with negative values!
	3264	for (i=0; i< Dens0->LocalSizeR; i++)
	3265	sigma_real[in+dexNDIM][i] = fabs(sigma_real[in+dexNDIM][i]);
	3266	}
	3267	}
	3268	UnLockDensityArray(Dens0,TempDensity,imag); // work
	3269	UnLockDensityArray(Dens0,Temp2Density,imag); // tempdestRC and field
	3270
	3271	// output tensor to file
	3272	if (P->Par.me == 0) {
	3273	sprintf(&suffixsigma[0], ".sigma_chi_rezi.L%i.csv", Lev0->LevelNo);
	3274	OpenFile(P, &SigmaFile, suffixsigma, "a", P->Call.out[ReadOut]);
	3275	fprintf(SigmaFile,"# chemical shielding tensor sigma_rezi[01,02,03,10,11,12,20,21,22], seed %i, config %s, run on %s", R->Seed, P->Files.default_path, ctime(&seconds));
	3276	fprintf(SigmaFile,"%lg\t", P->Lat.ECut/(Lat->LevelSizes[0]*Lat->LevelSizes[0]));
	3277	for (in=0;in<NDIM;in++)
	3278	for (dex=0;dex<NDIM;dex++)
	3279	fprintf(SigmaFile,"%e\t", GSL_REAL(gsl_matrix_complex_get(H,in,dex)));
	3280	fprintf(SigmaFile,"\n");
	3281	fclose(SigmaFile);
	3282	}
	3283
	3284	gsl_vector *eval = gsl_vector_alloc(NDIM);
	3285	gsl_eigen_herm_workspace *w = gsl_eigen_herm_alloc(NDIM);
	3286
	3287	for (it=0; it < I->Max_Types; it++) { // integration over all types
	3288	for (ion=0; ion < I->I[it].Max_IonsOfType; ion++) { // and each ion of type
	3289	if (P->Call.out[ValueOut]) fprintf(stderr,"(%i) Shielding Tensor for Ion %i of element %s \\sigma_ij = \n",P->Par.me, ion, I->I[it].Name);
	3290	for (in=0; in<NDIM; in++) { // index i of vector component in integrand
	3291	for (dex=0; dex<NDIM; dex++) {// index j of B component derivation in current density tensor
	3292	gsl_matrix_complex_set(H,in,dex,gsl_complex_rect((I->I[it].sigma_rezi[ion][in+dexNDIM]+I->I[it].sigma_rezi[ion][dex+inNDIM])/2.,0));
	3293	if (P->Call.out[ValueOut]) fprintf(stderr,"%e\t", I->I[it].sigma_rezi[ion][in+dex*NDIM]);
	3294	}
	3295	if (P->Call.out[ValueOut]) fprintf(stderr,"\n");
	3296	}
	3297	// output tensor to file
	3298	if (P->Par.me == 0) {
	3299	sprintf(&suffixsigma[0], ".sigma_i%i_%s_rezi.L%i.csv", ion, I->I[it].Symbol, Lev0->LevelNo);
	3300	OpenFile(P, &SigmaFile, suffixsigma, "a", P->Call.out[ReadOut]);
	3301	fprintf(SigmaFile,"# chemical shielding tensor sigma_rezi[01,02,03,10,11,12,20,21,22], seed %i, config %s, run on %s", R->Seed, P->Files.default_path, ctime(&seconds));
	3302	fprintf(SigmaFile,"%lg\t", P->Lat.ECut/(Lat->LevelSizes[0]*Lat->LevelSizes[0]));
	3303	for (in=0;in<NDIM;in++)
	3304	for (dex=0;dex<NDIM;dex++)
	3305	fprintf(SigmaFile,"%e\t", I->I[it].sigma_rezi[ion][in+dex*NDIM]);
	3306	fprintf(SigmaFile,"\n");
	3307	fclose(SigmaFile);
	3308	}
	3309	// diagonalize sigma
	3310	gsl_eigen_herm(H, eval, w);
	3311	gsl_sort_vector(eval); // sort eigenvalues
	3312	// print eigenvalues
	3313	// if (P->Call.out[ValueOut]) {
	3314	// fprintf(stderr,"(%i) diagonal shielding for Ion %i of element %s:", P->Par.me, ion, I->I[it].Name);
	3315	// for (in=0;in<NDIM;in++)
	3316	// fprintf(stderr,"\t%lg",gsl_vector_get(eval,in));
	3317	// fprintf(stderr,"\n\n");
	3318	// }
	3319	iso = 0.;
	3320	for (i=0;i<NDIM;i++) {
	3321	I->I[it].sigma_rezi_PAS[ion][i] = gsl_vector_get(eval,i);
	3322	iso += I->I[it].sigma_rezi[ion][i+i*NDIM]/3.;
	3323	}
	3324	eta = (gsl_vector_get(eval,1)-gsl_vector_get(eval,0))/(gsl_vector_get(eval,2)-iso);
	3325	delta_sigma = gsl_vector_get(eval,2) - 0.5*(gsl_vector_get(eval,0)+gsl_vector_get(eval,1));
	3326	S = (delta_sigmadelta_sigma)(1+1./3.etaeta);
	3327	A = 0.;
	3328	for (i=0;i<NDIM;i++) {
	3329	in = cross(i,0);
	3330	dex = cross(i,1);
	3331	A += pow(-1,i)pow(0.5(I->I[it].sigma_rezi[ion][in+dexNDIM]-I->I[it].sigma_rezi[ion][dex+inNDIM]),2);
	3332	}
	3333	if (P->Call.out[ValueOut]) {
	3334	fprintf(stderr,"(%i) converted to Principal Axis System\n==================\nDiagonal entries:", P->Par.me);
	3335	for (i=0;i<NDIM;i++)
	3336	fprintf(stderr,"\t%lg",gsl_vector_get(eval,i));
	3337	fprintf(stderr,"\nshielding : %e\n", iso);
	3338	fprintf(stderr,"anisotropy : %e\n", delta_sigma);
	3339	fprintf(stderr,"asymmetry : %e\n", eta);
	3340	fprintf(stderr,"S : %e\n", S);
	3341	fprintf(stderr,"A : %e\n", A);
	3342	fprintf(stderr,"==================\n");
	3343
	3344	}
	3345	}
	3346	}
	3347
	3348	// Output of magnetic field densities for each direction
	3349	for (i=0;i<NDIM*NDIM;i++)
	3350	OutputVis(P, sigma_real[i]);
	3351	// Diagonalizing the tensor "field" B_ij [r]
	3352	fprintf(stderr,"(%i) Diagonalizing B_ij [r] ... \n", P->Par.me);
	3353	for (i=0; i< Dens0->LocalSizeR; i++) {
	3354	for (in=0; in<NDIM; in++) // index i of vector component in integrand
	3355	for (dex=0; dex<NDIM; dex++) { // index j of B component derivation in current density tensor
	3356	//fprintf(stderr,"(%i) Setting B_(%i,%i)[%i] ... \n", P->Par.me, in,dex,i);
	3357	gsl_matrix_complex_set(H,in,dex,gsl_complex_rect((sigma_real[in+dexNDIM][i]+sigma_real[dex+inNDIM][i])/2.,0));
	3358	}
	3359	gsl_eigen_herm(H, eval, w);
	3360	gsl_sort_vector(eval); // sort eigenvalues
	3361	for (in=0;in<NDIM;in++)
	3362	sigma_real[in][i] = gsl_vector_get(eval,in);
	3363	}
	3364	// Output of diagonalized magnetic field densities for each direction
	3365	for (i=0;i<NDIM;i++)
	3366	OutputVis(P, sigma_real[i]);
	3367	for (i=0;i<NDIM*NDIM;i++)
	3368	UnLockDensityArray(Dens0,i,real); // sigma_imag/real free
	3369
	3370	gsl_eigen_herm_free(w);
	3371	gsl_vector_free(eval);
	3372	gsl_matrix_complex_free(H);
	3373	}
	3374
	3375
	3376	/** Calculates the chemical shielding tensor at the positions of the nuclei.
	3377	* The chemical shielding tensor at position R is defined as the proportionality factor between the induced and
	3378	* the externally applied field.
	3379	* \f[
	3380	* \sigma_{ij} (R) = \frac{\delta B_j^{ind} (R)}{\delta B_i^{ext}}
	3381	* = \frac{\mu_0}{4 \pi} \int d^3 r' \left ( \frac{r'-r}{\| r' - r \|^3} \times J_i (r') \right )_j
	3382	* \f]
	3383	* One after another for each nuclear position is the tensor evaluated and the result printed
	3384	* to screen. Tensor is diagonalized afterwards.
	3385	* \param *P Problem at hand
	3386	* \sa CalculateMagneticSusceptibility() - similar calculation, yet without translation to ion centers.
	3387	* \warning This routine is out-dated due to being numerically unstable because of the singularity which is not
	3388	* considered carefully, recommendend replacement is CalculateChemicalShieldingByReciprocalCurrentDensity().
	3389	*/
	3390	void CalculateChemicalShielding(struct Problem *P)
	3391	{
	3392	struct RunStruct *R = &P->R;
	3393	struct Lattice *Lat = &P->Lat;
	3394	struct LatticeLevel *Lev0 = R->Lev0;
	3395	struct Density *Dens0 = R->Lev0->Dens;
	3396	struct Ions *I = &P->Ion;
	3397	double sigma[NDIMNDIM],Sigma[NDIMNDIM];
	3398	fftw_real CurrentDensity[NDIMNDIM];
	3399	int it, ion, in, dex, i0, n[NDIM], n0, i;//, *NUp;
	3400	double x,y,z;
	3401	double dist;
	3402	double r[NDIM], fac[NDIM];
	3403	const double discrete_factor = Lat->Volume/Lev0->MaxN;
	3404	double eta, delta_sigma, S, A, iso;
	3405	const int myPE = P->Par.me_comm_ST_Psi;
	3406	int N[NDIM];
	3407	N[0] = Lev0->Plan0.plan->N[0];
	3408	N[1] = Lev0->Plan0.plan->N[1];
	3409	N[2] = Lev0->Plan0.plan->N[2];
	3410	const int N0 = Lev0->Plan0.plan->local_nx;
	3411	FILE *SigmaFile;
	3412	char suffixsigma[255];
	3413	time_t seconds;
	3414	time(&seconds); // get current time
	3415
	3416	// set pointers onto current density
	3417	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
	3418	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
	3419	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
	3420	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
	3421	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
	3422	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
	3423	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
	3424	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
	3425	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
	3426	gsl_matrix_complex *H = gsl_matrix_complex_calloc(NDIM,NDIM);
	3427
	3428	for (it=0; it < I->Max_Types; it++) { // integration over all types
	3429	for (ion=0; ion < I->I[it].Max_IonsOfType; ion++) { // and each ion of type
	3430	if (P->Call.out[ValueOut]) fprintf(stderr,"(%i) Shielding Tensor for Ion %i of element %s \\sigma_ij = \n",P->Par.me, ion, I->I[it].Name);
	3431	for (in=0; in<NDIM; in++) {// index i of vector component in integrand
	3432	for (dex=0; dex<NDIM; dex++) { // index j of B component derivation in current density tensor
	3433	sigma[in+dex*NDIM] = 0.;
	3434
	3435	for(n0=0;n0<N0;n0++) // do the integration over real space
	3436	for(n[1]=0;n[1]<N[1];n[1]++)
	3437	for(n[2]=0;n[2]<N[2];n[2]++) {
	3438	n[0]=n0 + N0*myPE; // global relative coordinate: due to partitoning of x-axis in PEPGamma>1 case
	3439	fac[0] = (double)n[0]/(double)N[0];
	3440	fac[1] = (double)n[1]/(double)N[1];
	3441	fac[2] = (double)n[2]/(double)N[2];
	3442	RMat33Vec3(r, Lat->RealBasis, fac);
	3443	i0 = n[2]+N[2](n[1]+N[1](n0)); // the index of current density must match LocalSizeR!
	3444	x = MinImageConv(Lat,r[cross(in,0)], I->I[it].R[NDIM*ion+cross(in,0)],cross(in,0));
	3445	y = MinImageConv(Lat,r[cross(in,2)], I->I[it].R[NDIM*ion+cross(in,2)],cross(in,2));
	3446	z = MinImageConv(Lat,r[in], I->I[it].R[NDIM*ion+in],in); // "in" always is missing third component in cross product
	3447	dist = pow(xx + yy + z*z, 3./2.);
	3448	if ((dist < pow(2.,3.)) && (dist > MYEPSILON)) sigma[in+dexNDIM] += (x CurrentDensity[dexNDIM+cross(in,1)][i0] - y CurrentDensity[dex*NDIM+cross(in,3)][i0])/dist;
	3449	//if (it == 0 && ion == 0) fprintf(stderr,"(%i) sigma[%i][%i] += (%e * %e - %e * %e)/%e = %e\n", P->Par.me, in, dex, x,CurrentDensity[dexNDIM+cross(in,1)][i0],y,CurrentDensity[dexNDIM+cross(in,3)][i0],dist,sigma[in+dex*NDIM]);
	3450	}
	3451	sigma[in+dexNDIM] = -mu0discrete_factor/(4.PI); // due to summation instead of integration
	3452	MPI_Allreduce ( &sigma[in+dexNDIM], &Sigma[in+dexNDIM], 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum "LocalSize to TotalSize"
	3453	I->I[it].sigma[ion][in+dexNDIM] = Sigma[in+dexNDIM];
	3454	if (P->Call.out[ValueOut]) fprintf(stderr," %e", Sigma[in+dex*NDIM]);
	3455	}
	3456	if (P->Call.out[ValueOut]) fprintf(stderr,"\n");
	3457	}
	3458	// store symmetrized matrix
	3459	for (in=0;in<NDIM;in++)
	3460	for (dex=0;dex<NDIM;dex++)
	3461	gsl_matrix_complex_set(H,in,dex,gsl_complex_rect((Sigma[in+dexNDIM]+Sigma[dex+inNDIM])/2.,0));
	3462	// output tensor to file
	3463	if (P->Par.me == 0) {
	3464	sprintf(&suffixsigma[0], ".sigma_i%i_%s.L%i.csv", ion, I->I[it].Symbol, Lev0->LevelNo);
	3465	OpenFile(P, &SigmaFile, suffixsigma, "a", P->Call.out[ReadOut]);
	3466	fprintf(SigmaFile,"# chemical shielding tensor sigma[01,02,03,10,11,12,20,21,22], seed %i, config %s, run on %s", R->Seed, P->Files.default_path, ctime(&seconds));
	3467	fprintf(SigmaFile,"%lg\t", P->Lat.ECut/(Lat->LevelSizes[0]*Lat->LevelSizes[0]));
	3468	for (in=0;in<NDIM*NDIM;in++)
	3469	fprintf(SigmaFile,"%e\t", Sigma[in]);
	3470	fprintf(SigmaFile,"\n");
	3471	fclose(SigmaFile);
	3472	}
	3473	// diagonalize sigma
	3474	gsl_vector *eval = gsl_vector_alloc(NDIM);
	3475	gsl_eigen_herm_workspace *w = gsl_eigen_herm_alloc(NDIM);
	3476	gsl_eigen_herm(H, eval, w);
	3477	gsl_eigen_herm_free(w);
	3478	gsl_sort_vector(eval); // sort eigenvalues
	3479	// print eigenvalues
	3480	// if (P->Call.out[ValueOut]) {
	3481	// fprintf(stderr,"(%i) diagonal shielding for Ion %i of element %s:", P->Par.me, ion, I->I[it].Name);
	3482	// for (in=0;in<NDIM;in++)
	3483	// fprintf(stderr,"\t%lg",gsl_vector_get(eval,in));
	3484	// fprintf(stderr,"\n\n");
	3485	// }
	3486	// print eigenvalues
	3487	iso = 0;
	3488	for (i=0;i<NDIM;i++) {
	3489	I->I[it].sigma[ion][i] = gsl_vector_get(eval,i);
	3490	iso += Sigma[i+i*NDIM]/3.;
	3491	}
	3492	eta = (gsl_vector_get(eval,1)-gsl_vector_get(eval,0))/(gsl_vector_get(eval,2)-iso);
	3493	delta_sigma = gsl_vector_get(eval,2) - 0.5*(gsl_vector_get(eval,0)+gsl_vector_get(eval,1));
	3494	S = (delta_sigmadelta_sigma)(1+1./3.etaeta);
	3495	A = 0.;
	3496	for (i=0;i<NDIM;i++) {
	3497	in = cross(i,0);
	3498	dex = cross(i,1);
	3499	A += pow(-1,i)pow(0.5(Sigma[in+dexNDIM]-Sigma[dex+inNDIM]),2);
	3500	}
	3501	if (P->Call.out[ValueOut]) {
	3502	fprintf(stderr,"(%i) converted to Principal Axis System\n==================\nDiagonal entries:", P->Par.me);
	3503	for (i=0;i<NDIM;i++)
	3504	fprintf(stderr,"\t%lg",gsl_vector_get(eval,i));
	3505	fprintf(stderr,"\nshielding : %e\n", iso);
	3506	fprintf(stderr,"anisotropy : %e\n", delta_sigma);
	3507	fprintf(stderr,"asymmetry : %e\n", eta);
	3508	fprintf(stderr,"S : %e\n", S);
	3509	fprintf(stderr,"A : %e\n", A);
	3510	fprintf(stderr,"==================\n");
	3511
	3512	}
	3513	gsl_vector_free(eval);
	3514	}
	3515	}
	3516
	3517	gsl_matrix_complex_free(H);
	3518	}
	3519
	3520	/** Test if integrated current over cell is 0.
	3521	* In most cases we do not reach a numerical sensible zero as in MYEPSILON and remain satisfied as long
	3522	* as the integrated current density is very small (e.g. compared to single entries in the current density array)
	3523	* \param *P Problem at hand
	3524	* \param index index of current component
	3525	* \sa CalculateNativeIntDens() for integration of one current tensor component
	3526	*/
	3527	void TestCurrent(struct Problem *P, const int index)
	3528	{
	3529	struct RunStruct *R = &P->R;
	3530	struct LatticeLevel *Lev0 = R->Lev0;
	3531	struct Density *Dens0 = Lev0->Dens;
	3532	fftw_real CurrentDensity[NDIMNDIM];
	3533	int in;
	3534	double result[NDIM*NDIM], res = 0.;
	3535
	3536	// set pointers onto current density array and get number of grid points in each direction
	3537	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
	3538	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
	3539	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
	3540	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
	3541	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
	3542	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
	3543	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
	3544	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
	3545	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
	3546	for(in=0;in<NDIM;in++) {
	3547	result[in] = CalculateNativeIntDens(P,Lev0,CurrentDensity[in + NDIM*index],R->FactorDensityR);
	3548	res += pow(result[in],2.);
	3549	}
	3550	res = sqrt(res);
	3551	// if greater than 0, complain about it
	3552	if ((res > MYEPSILON) && (P->Call.out[LeaderOut]))
	3553	fprintf(stderr, "(%i) \\int_\\Omega d^3 r j_%i(r) = (%e,%e,%e), %e > %e!\n",P->Par.me, index, result[0], result[1], result[2], res, MYEPSILON);
	3554	}
	3555
	3556	/** Testing whether re<->im switches (due to symmetry) confuses fft.
	3557	* \param *P Problem at hand
	3558	* \param l local wave function number
	3559	*/
	3560	void test_fft_symmetry(struct Problem *P, const int l)
	3561	{
	3562	struct Lattice *Lat = &P->Lat;
	3563	struct RunStruct *R = &P->R;
	3564	struct LatticeLevel *LevS = R->LevS;
	3565	struct LatticeLevel *Lev0 = R->Lev0;
	3566	struct Density *Dens0 = Lev0->Dens;
	3567	struct fft_plan_3d *plan = Lat->plan;
	3568	fftw_complex tempdestRC = (fftw_complex )Dens0->DensityCArray[Temp2Density];
	3569	fftw_complex *work = Dens0->DensityCArray[TempDensity];
	3570	fftw_complex workC = (fftw_complex )Dens0->DensityArray[TempDensity];
	3571	fftw_complex posfac, destpos, destRCS, destRCD;
	3572	fftw_complex *PsiC = Dens0->DensityCArray[ActualPsiDensity];
	3573	fftw_real PsiCR = (fftw_real ) PsiC;
	3574	fftw_complex *Psi0 = LevS->LPsi->LocalPsi[l];
	3575	fftw_complex *dest = LevS->LPsi->TempPsi;
	3576	fftw_real Psi0R = (fftw_real )Dens0->DensityArray[Temp2Density];
	3577	int i,Index, pos, i0, iS,g; //, NoOfPsis = Psi->TypeStartIndex[UnOccupied] - Psi->TypeStartIndex[Occupied];
	3578	int n[NDIM], n0;
	3579	const int N0 = LevS->Plan0.plan->local_nx; // we don't want to build global density, but local
	3580	int N[NDIM], NUp[NDIM];
	3581	N[0] = LevS->Plan0.plan->N[0];
	3582	N[1] = LevS->Plan0.plan->N[1];
	3583	N[2] = LevS->Plan0.plan->N[2];
	3584	NUp[0] = LevS->NUp[0];
	3585	NUp[1] = LevS->NUp[1];
	3586	NUp[2] = LevS->NUp[2];
	3587	//const int k_normal = Lat->Psi.TypeStartIndex[Occupied] + (l - Lat->Psi.TypeStartIndex[R->CurrentMin]);
	3588	//const double *Wcentre = Lat->Psi.AddData[k_normal].WannierCentre;
	3589	//double x[NDIM], fac[NDIM];
	3590	double result1=0., result2=0., result3=0., result4=0.;
	3591	double Result1=0., Result2=0., Result3=0., Result4=0.;
	3592	const double HGcRCFactor = 1./LevS->MaxN; // factor for inverse fft
	3593
	3594
	3595	// fft to real space
	3596	SetArrayToDouble0((double )tempdestRC, Dens0->TotalSize2);
	3597	SetArrayToDouble0((double )PsiC, Dens0->TotalSize2);
	3598	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is positive
	3599	Index = LevS->GArray[i].Index;
	3600	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
	3601	destpos = &tempdestRC[LevS->MaxNUp*Index];
	3602	for (pos=0; pos < LevS->MaxNUp; pos++) {
	3603	destpos[pos].re = (Psi0[i].re)posfac[pos].re-(Psi0[i].im)posfac[pos].im;
	3604	destpos[pos].im = (Psi0[i].re)posfac[pos].im+(Psi0[i].im)posfac[pos].re;
	3605	//destpos[pos].re = (Psi0[i].im)posfac[pos].re-(-Psi0[i].re)posfac[pos].im;
	3606	//destpos[pos].im = (Psi0[i].im)posfac[pos].im+(-Psi0[i].re)posfac[pos].re;
	3607	}
	3608	}
	3609	for (i=0; i<LevS->MaxDoubleG; i++) {
	3610	destRCS = &tempdestRC[LevS->DoubleG[2i]LevS->MaxNUp];
	3611	destRCD = &tempdestRC[LevS->DoubleG[2i+1]LevS->MaxNUp];
	3612	for (pos=0; pos < LevS->MaxNUp; pos++) {
	3613	destRCD[pos].re = destRCS[pos].re;
	3614	destRCD[pos].im = -destRCS[pos].im;
	3615	}
	3616	}
	3617	fft_3d_complex_to_real(plan, LevS->LevelNo, FFTNFUp, tempdestRC, work);
	3618	DensityRTransformPos(LevS,(fftw_real*)tempdestRC, Psi0R);
	3619
	3620	// apply position operator and do first result
	3621	for (n0=0;n0<N0;n0++) // only local points on x axis
	3622	for (n[1]=0;n[1]<N[1];n[1]++)
	3623	for (n[2]=0;n[2]<N[2];n[2]++) {
	3624	n[0]=n0 + LevS->Plan0.plan->start_nx; // global relative coordinate: due to partitoning of x-axis in PEPGamma>1 case
	3625	i0 = n[2]NUp[2]+N[2]NUp[2](n[1]NUp[1]+N[1]NUp[1]n0*NUp[0]);
	3626	iS = n[2]+N[2](n[1]+N[1]n0);
	3627	//x[0] += 1; // shifting expectation value of x coordinate from 0 to 1
	3628	PsiCR[iS] = Psi0R[i0]; // truedist(Lat, x[0], Wcentre[0],0) *
	3629	result1 += PsiCR[iS] * Psi0R[i0];
	3630	}
	3631	result1 /= LevS->MaxN; // factor due to discrete integration
	3632	MPI_Allreduce ( &result1, &Result1, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum "LocalSize to TotalSize"
	3633	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) 1st result: %e\n",P->Par.me, Result1);
	3634
	3635	// fft to reciprocal space and do second result
	3636	fft_3d_real_to_complex(plan, LevS->LevelNo, FFTNF1, PsiC, workC);
	3637	SetArrayToDouble0((double )dest, 2R->InitLevS->MaxG);
	3638	for (g=0; g < LevS->MaxG; g++) {
	3639	Index = LevS->GArray[g].Index;
	3640	dest[g].re = (Psi0[Index].re)*HGcRCFactor;
	3641	dest[g].im = (Psi0[Index].im)*HGcRCFactor;
	3642	}
	3643	result2 = GradSP(P,LevS,Psi0,dest);
	3644	MPI_Allreduce ( &result2, &Result2, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum "LocalSize to TotalSize"
	3645	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) 2nd result: %e\n",P->Par.me, Result2);
	3646
	3647	// fft again to real space, this time change symmetry
	3648	SetArrayToDouble0((double )tempdestRC, Dens0->TotalSize2);
	3649	SetArrayToDouble0((double )PsiC, Dens0->TotalSize2);
	3650	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is positive
	3651	Index = LevS->GArray[i].Index;
	3652	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
	3653	destpos = &tempdestRC[LevS->MaxNUp*Index];
	3654	for (pos=0; pos < LevS->MaxNUp; pos++) {
	3655	destpos[pos].re = (Psi0[i].im)posfac[pos].re-(-Psi0[i].re)posfac[pos].im;
	3656	destpos[pos].im = (Psi0[i].im)posfac[pos].im+(-Psi0[i].re)posfac[pos].re;
	3657	}
	3658	}
	3659	for (i=0; i<LevS->MaxDoubleG; i++) {
	3660	destRCS = &tempdestRC[LevS->DoubleG[2i]LevS->MaxNUp];
	3661	destRCD = &tempdestRC[LevS->DoubleG[2i+1]LevS->MaxNUp];
	3662	for (pos=0; pos < LevS->MaxNUp; pos++) {
	3663	destRCD[pos].re = destRCS[pos].re;
	3664	destRCD[pos].im = -destRCS[pos].im;
	3665	}
	3666	}
	3667	fft_3d_complex_to_real(plan, LevS->LevelNo, FFTNFUp, tempdestRC, work);
	3668	DensityRTransformPos(LevS,(fftw_real*)tempdestRC, Psi0R);
	3669
	3670	// bring down from Lev0 to LevS
	3671	for (n0=0;n0<N0;n0++) // only local points on x axis
	3672	for (n[1]=0;n[1]<N[1];n[1]++)
	3673	for (n[2]=0;n[2]<N[2];n[2]++) {
	3674	i0 = n[2]NUp[2]+N[2]NUp[2](n[1]NUp[1]+N[1]NUp[1]n0*NUp[0]);
	3675	iS = n[2]+N[2](n[1]+N[1]n0);
	3676	PsiCR[iS] = Psi0R[i0]; // truedist(Lat, x[0], Wcentre[0],0) *
	3677	result3 += PsiCR[iS] * Psi0R[i0];
	3678	}
	3679	result3 /= LevS->MaxN; // factor due to discrete integration
	3680	MPI_Allreduce ( &result3, &Result3, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum "LocalSize to TotalSize"
	3681	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) 3rd result: %e\n",P->Par.me, Result3);
	3682
	3683	// fft back to reciprocal space, change symmetry back and do third result
	3684	fft_3d_real_to_complex(plan, LevS->LevelNo, FFTNF1, PsiC, workC);
	3685	SetArrayToDouble0((double )dest, 2R->InitLevS->MaxG);
	3686	for (g=0; g < LevS->MaxG; g++) {
	3687	Index = LevS->GArray[g].Index;
	3688	dest[g].re = (-PsiC[Index].im)*HGcRCFactor;
	3689	dest[g].im = ( PsiC[Index].re)*HGcRCFactor;
	3690	}
	3691	result4 = GradSP(P,LevS,Psi0,dest);
	3692	MPI_Allreduce ( &result4, &Result4, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum "LocalSize to TotalSize"
	3693	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) 4th result: %e\n",P->Par.me, Result4);
	3694	}
	3695
	3696
	3697	/** Test function to check RxP application.
	3698	* Checks applied solution to an analytic for a specific and simple wave function -
	3699	* where just one coefficient is unequal to zero.
	3700	* \param *P Problem at hand
	3701	exp(I b G) - I exp(I b G) b G - exp(I a G) + I exp(I a G) a G
	3702	-------------------------------------------------------------
	3703	2
	3704	G
	3705	*/
	3706	void test_rxp(struct Problem *P)
	3707	{
	3708	struct RunStruct *R = &P->R;
	3709	struct Lattice *Lat = &P->Lat;
	3710	//struct LatticeLevel *Lev0 = R->Lev0;
	3711	struct LatticeLevel *LevS = R->LevS;
	3712	struct OneGData *GA = LevS->GArray;
	3713	//struct Density *Dens0 = Lev0->Dens;
	3714	fftw_complex *Psi0 = LevS->LPsi->TempPsi;
	3715	fftw_complex *Psi2 = P->Grad.GradientArray[GraSchGradient];
	3716	fftw_complex *Psi3 = LevS->LPsi->TempPsi2;
	3717	int g, g_bar, i, j, k, k_normal = 0;
	3718	double tmp, a,b, G;
	3719	//const double *Wcentre = Lat->Psi.AddData[k_normal].WannierCentre;
	3720	const double discrete_factor = 1.;//Lat->Volume/LevS->MaxN;
	3721	fftw_complex integral;
	3722
	3723	// reset coefficients
	3724	debug (P,"Creating RxP test function.");
	3725	SetArrayToDouble0((double )Psi0,2R->InitLevS->MaxG);
	3726	SetArrayToDouble0((double )Psi2,2R->InitLevS->MaxG);
	3727
	3728	// pick one which becomes non-zero
	3729	g = 3;
	3730
	3731	//for (g=0;g<LevS->MaxG;g++) {
	3732	Psi0[g].re = 1.;
	3733	Psi0[g].im = 0.;
	3734	//}
	3735	fprintf(stderr,"(%i) G[%i] = (%e,%e,%e) \n",P->Par.me, g, GA[g].G[0], GA[g].G[1], GA[g].G[2]);
	3736	i = 0;
	3737
	3738	// calculate analytic result
	3739	debug (P,"Calculating analytic solution.");
	3740	for (g_bar=0;g_bar<LevS->MaxG;g_bar++) {
	3741	for (g=0;g<LevS->MaxG;g++) {
	3742	if (GA[g].G[i] == GA[g_bar].G[i]) {
	3743	j = cross(i,0);
	3744	k = cross(i,1);
	3745	if (GA[g].G[k] == GA[g_bar].G[k]) {
[f5586e]	3746	//b = truedist(Lat, sqrt(Lat->RealBasisSQ[j]), Wcentre[j], j);
	3747	b = sqrt(Lat->RealBasisSQ[j]);
[a0bcf1]	3748	//a = truedist(Lat, 0., Wcentre[j], j);
	3749	a = 0.;
	3750	G = 1; //GA[g].G[k];
	3751	if (GA[g].G[j] == GA[g_bar].G[j]) {
	3752	Psi2[g_bar].re += GPsi0[g].re (.5 * b * b - .5 * a * a) * discrete_factor;
	3753	Psi2[g_bar].im += GPsi0[g].im (.5 * b * b - .5 * a * a) * discrete_factor;
	3754	//if ((G != 0) && ((fabs(Psi0[g].re) > MYEPSILON) \|\| (fabs(Psi0[g].im) > MYEPSILON)))
	3755	//fprintf(stderr,"(%i) Psi[%i].re += %e +i %e\n",P->Par.me, g_bar, GPsi0[g].re (.5 * b * b - .5 * a * a) * discrete_factor, GPsi0[g].im (.5 * b * b - .5 * a * a) * discrete_factor);
	3756	} else {
	3757	tmp = GA[g].G[j]-GA[g_bar].G[j];
	3758	integral.re = (cos(tmpb)+sin(tmpb)btmp - cos(tmpa)-sin(tmpa)atmp) / (tmp * tmp);
	3759	integral.im = (sin(tmpb)-cos(tmpb)btmp - sin(tmpa)+cos(tmpa)atmp) / (tmp * tmp);
	3760	Psi2[g_bar].re += G(Psi0[g].reintegral.re - Psi0[g].imintegral.im) discrete_factor;
	3761	Psi2[g_bar].im += G(Psi0[g].reintegral.im + Psi0[g].imintegral.re) discrete_factor;
	3762	//if ((G != 0) && ((fabs(Psi0[g].re) > MYEPSILON) \|\| (fabs(Psi0[g].im) > MYEPSILON)))
	3763	//fprintf(stderr,"(%i) Psi[%i].re += %e\tPsi[%i].im += %e \n",P->Par.me, g_bar, G(Psi0[g].reintegral.re - Psi0[g].imintegral.im) discrete_factor, g_bar, G(Psi0[g].reintegral.im + Psi0[g].imintegral.re) discrete_factor);
	3764	}
	3765	}
	3766	j = cross(i,2);
	3767	k = cross(i,3);
	3768	if (GA[g].G[k] == GA[g_bar].G[k]) {
[f5586e]	3769	//b = truedist(Lat, sqrt(Lat->RealBasisSQ[j]), Wcentre[j], j);
	3770	b = sqrt(Lat->RealBasisSQ[j]);
[a0bcf1]	3771	//a = truedist(Lat, 0., Wcentre[j], j);
	3772	a = 0.;
	3773	G = 1; //GA[g].G[k];
	3774	if (GA[g].G[j] == GA[g_bar].G[j]) {
	3775	Psi2[g_bar].re += GPsi0[g].re (.5 * b * b - .5 * a * a) * discrete_factor;
	3776	Psi2[g_bar].im += GPsi0[g].im (.5 * b * b - .5 * a * a) * discrete_factor;
	3777	//if ((G != 0) && ((fabs(Psi0[g].re) > MYEPSILON) \|\| (fabs(Psi0[g].im) > MYEPSILON)))
	3778	//fprintf(stderr,"(%i) Psi[%i].re += %e +i %e\n",P->Par.me, g_bar, GPsi0[g].re (.5 * b * b - .5 * a * a) * discrete_factor, GPsi0[g].im (.5 * b * b - .5 * a * a) * discrete_factor);
	3779	} else {
	3780	tmp = GA[g].G[j]-GA[g_bar].G[j];
	3781	integral.re = (cos(tmpb)+sin(tmpb)btmp - cos(tmpa)-sin(tmpa)atmp) / (tmp * tmp);
	3782	integral.im = (sin(tmpb)-cos(tmpb)btmp - sin(tmpa)+cos(tmpa)atmp) / (tmp * tmp);
	3783	Psi2[g_bar].re += G(Psi0[g].reintegral.re - Psi0[g].imintegral.im) discrete_factor;
	3784	Psi2[g_bar].im += G(Psi0[g].reintegral.im + Psi0[g].imintegral.re) discrete_factor;
	3785	//if ((G != 0) && ((fabs(Psi0[g].re) > MYEPSILON) \|\| (fabs(Psi0[g].im) > MYEPSILON)))
	3786	//fprintf(stderr,"(%i) Psi[%i].re += %e\tPsi[%i].im += %e \n",P->Par.me, g_bar, G(Psi0[g].reintegral.re - Psi0[g].imintegral.im) discrete_factor, g_bar, G(Psi0[g].reintegral.im + Psi0[g].imintegral.re) discrete_factor);
	3787	}
	3788	}
	3789	}
	3790	}
	3791	}
	3792
	3793	// apply rxp
	3794	debug (P,"Applying RxP to test function.");
	3795	CalculatePerturbationOperator_RxP(P,Psi0,Psi3,k_normal,i);
	3796
	3797	// compare both coefficient arrays
	3798	debug(P,"Beginning comparison of analytic and Rxp applied solution.");
	3799	for (g=0;g<LevS->MaxG;g++) {
	3800	if ((fabs(Psi3[g].re-Psi2[g].re) >= MYEPSILON) \|\| (fabs(Psi3[g].im-Psi2[g].im) >= MYEPSILON))
	3801	fprintf(stderr,"(%i) Psi3[%i] = %e +i %e != Psi2[%i] = %e +i %e\n",P->Par.me, g, Psi3[g].re, Psi3[g].im, g, Psi2[g].re, Psi2[g].im);
	3802	//else
	3803	//fprintf(stderr,"(%i) Psi1[%i] == Psi2[%i] = %e +i %e\n",P->Par.me, g, g, Psi1[g].re, Psi1[g].im);
	3804	}
	3805	fprintf(stderr,"(%i) <0\|1> = <0\|r\|0> == %e +i %e\n",P->Par.me, GradSP(P,LevS,Psi0,Psi3), GradImSP(P,LevS,Psi0,Psi3));
	3806	fprintf(stderr,"(%i) <1\|1> = \|r\|ï¿œ == %e +i %e\n",P->Par.me, GradSP(P,LevS,Psi3,Psi3), GradImSP(P,LevS,Psi3,Psi3));
	3807	fprintf(stderr,"(%i) <0\|0> = %e +i %e\n",P->Par.me, GradSP(P,LevS,Psi0,Psi0), GradImSP(P,LevS,Psi0,Psi0));
	3808	fprintf(stderr,"(%i) <0\|2> = %e +i %e\n",P->Par.me, GradSP(P,LevS,Psi0,Psi2), GradImSP(P,LevS,Psi0,Psi2));
	3809	}
	3810
	3811
	3812	/** Output of a (X,Y,DX,DY) 2d-vector plot.
	3813	* For a printable representation of the induced current two-dimensional vector plots are useful, as three-dimensional
	3814	* isospheres are sometimes mis-leading or do not represent the desired flow direction. The routine simply extracts a
	3815	* two-dimensional cut orthogonal to one of the lattice axis at a certain node.
	3816	* \param *P Problem at hand
	3817	* \param B_index direction of B field
	3818	* \param n_orth grid node in B_index direction of the plane (the order in which the remaining two coordinate axis
	3819	* appear is the same as in a cross product, which is used to determine orthogonality)
	3820	*/
	3821	void PlotVectorPlane(struct Problem *P, int B_index, int n_orth)
	3822	{
	3823	struct RunStruct *R = &P->R;
	3824	struct LatticeLevel *Lev0 = R->Lev0;
	3825	struct Density *Dens0 = Lev0->Dens;
	3826	char filename[255];
	3827	char *suchpointer;
	3828	FILE *PlotFile = NULL;
	3829	const int myPE = P->Par.me_comm_ST;
	3830	time_t seconds;
	3831	fftw_real CurrentDensity[NDIMNDIM];
	3832	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
	3833	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
	3834	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
	3835	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
	3836	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
	3837	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
	3838	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
	3839	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
	3840	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
	3841	time(&seconds); // get current time
	3842
	3843	if (!myPE) { // only process 0 writes to file
	3844	// open file
	3845	sprintf(&filename[0], ".current.L%i.csv", Lev0->LevelNo);
	3846	OpenFile(P, &PlotFile, filename, "w", P->Call.out[ReadOut]);
	3847	strcpy(filename, ctime(&seconds));
	3848	suchpointer = strchr(filename, '\n');
	3849	if (suchpointer != NULL)
	3850	*suchpointer = '\0';
	3851	if (PlotFile != NULL) {
	3852	fprintf(PlotFile,"# current vector plot of plane perpendicular to direction e_%i at node %i, seed %i, config %s, run on %s, #cpus %i", B_index, n_orth, R->Seed, P->Files.default_path, filename, P->Par.Max_me_comm_ST_Psi);
	3853	fprintf(PlotFile,"\n");
	3854	} else { Error(SomeError, "PlotVectorPlane: Opening Plot File"); }
	3855	}
	3856
	3857	// plot density
	3858	if (!P->Par.me_comm_ST_PsiT) // only first wave function group as current density of all psis was gathered
	3859	PlotRealDensity(P, Lev0, PlotFile, B_index, n_orth, CurrentDensity[B_indexNDIM+cross(B_index,0)], CurrentDensity[B_indexNDIM+cross(B_index,1)]);
	3860
	3861	if (PlotFile != NULL) {
	3862	// close file
	3863	fclose(PlotFile);
	3864	}
	3865	}
	3866
	3867
	3868	/** Reads psi coefficients of \a type from file and transforms to new level.
	3869	* \param *P Problem at hand
	3870	* \param type PsiTypeTag of which minimisation group to load from file
	3871	* \sa ReadSrcPsiDensity() - reading the coefficients, ChangePsiAndDensToLevUp() - transformation to upper level
	3872	*/
	3873	void ReadSrcPerturbedPsis(struct Problem *P, enum PsiTypeTag type)
	3874	{
	3875	struct RunStruct *R = &P->R;
	3876	struct Lattice *Lat = &P->Lat;
	3877	struct LatticeLevel *Lev0 = &P->Lat.Lev[R->Lev0No+1]; // one level higher than current (ChangeLevUp already occurred)
	3878	struct LatticeLevel *LevS = &P->Lat.Lev[R->LevSNo+1];
	3879	struct Density *Dens = Lev0->Dens;
	3880	struct Psis *Psi = &Lat->Psi;
	3881	struct fft_plan_3d *plan = Lat->plan;
	3882	fftw_complex work = (fftw_complex )Dens->DensityCArray[TempDensity];
	3883	fftw_complex tempdestRC = (fftw_complex )Dens->DensityArray[TempDensity];
	3884	fftw_complex posfac, destpos, destRCS, destRCD;
	3885	fftw_complex source, source0;
	3886	int Index,i,pos;
	3887	double factorC = 1./Lev0->MaxN;
	3888	int p,g;
	3889
	3890	// ================= read coefficients from file to LocalPsi ============
	3891	ReadSrcPsiDensity(P, type, 0, R->LevSNo+1);
	3892
	3893	// ================= transform to upper level ===========================
	3894	// for all local Psis do the usual transformation (completing coefficients for all grid vectors, fft, permutation)
	3895	LockDensityArray(Dens, TempDensity, real);
	3896	LockDensityArray(Dens, TempDensity, imag);
	3897	for (p=Psi->LocalNo-1; p >= 0; p--)
	3898	if (Psi->LocalPsiStatus[p].PsiType == type) { // only for the desired type
	3899	source = LevS->LPsi->LocalPsi[p];
	3900	source0 = Lev0->LPsi->LocalPsi[p];
	3901	//fprintf(stderr,"(%i) ReadSrcPerturbedPsis: LevSNo %i\t Lev0No %i\tp %i\t source %p\t source0 %p\n", P->Par.me, LevS->LevelNo, Lev0->LevelNo, p, source, source0);
	3902	SetArrayToDouble0((double )tempdestRC, Dens->TotalSize2);
	3903	for (i=0;i<LevS->MaxG;i++) {
	3904	Index = LevS->GArray[i].Index;
	3905	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
	3906	destpos = &tempdestRC[LevS->MaxNUp*Index];
	3907	//if (isnan(source[i].re)) { fprintf(stderr,"(%i) WARNING in ReadSrcPerturbedPsis(): source_%i[%i] = NaN!\n", P->Par.me, p, i); Error(SomeError, "NaN-Fehler!"); }
	3908	for (pos=0; pos < LevS->MaxNUp; pos++) {
	3909	destpos[pos].re = source[i].reposfac[pos].re-source[i].imposfac[pos].im;
	3910	destpos[pos].im = source[i].reposfac[pos].im+source[i].imposfac[pos].re;
	3911	}
	3912	}
	3913	for (i=0; i<LevS->MaxDoubleG; i++) {
	3914	destRCS = &tempdestRC[LevS->DoubleG[2i]LevS->MaxNUp];
	3915	destRCD = &tempdestRC[LevS->DoubleG[2i+1]LevS->MaxNUp];
	3916	for (pos=0; pos < LevS->MaxNUp; pos++) {
	3917	destRCD[pos].re = destRCS[pos].re;
	3918	destRCD[pos].im = -destRCS[pos].im;
	3919	}
	3920	}
	3921	fft_3d_complex_to_real(plan, LevS->LevelNo, FFTNFUp, tempdestRC, work);
	3922	DensityRTransformPos(LevS,(fftw_real)tempdestRC,(fftw_real )Dens->DensityCArray[ActualPsiDensity]);
	3923	// now we have density in the upper level, fft back to complex and store it as wave function coefficients
	3924	fft_3d_real_to_complex(plan, Lev0->LevelNo, FFTNF1, Dens->DensityCArray[ActualPsiDensity], work);
	3925	for (g=0; g < Lev0->MaxG; g++) {
	3926	Index = Lev0->GArray[g].Index;
	3927	source0[g].re = Dens->DensityCArray[ActualPsiDensity][Index].re*factorC;
	3928	source0[g].im = Dens->DensityCArray[ActualPsiDensity][Index].im*factorC;
	3929	//if (isnan(source0[g].re)) { fprintf(stderr,"(%i) WARNING in ReadSrcPerturbedPsis(): source0_%i[%i] = NaN!\n", P->Par.me, p, g); Error(SomeError, "NaN-Fehler!"); }
	3930	}
	3931	if (Lev0->GArray[0].GSq == 0.0)
	3932	source0[g].im = 0.0;
	3933	}
	3934	UnLockDensityArray(Dens, TempDensity, real);
	3935	UnLockDensityArray(Dens, TempDensity, imag);
	3936	// finished.
	3937	}

Note: See TracBrowser for help on using the repository browser.

Context Navigation

source: pcp/src/perturbed.c@ 88e890

Download in other formats: