Context Navigation

source: pcp/src/perturbed.c@ b0aa9c

Visit:

Last change on this file since b0aa9c was b0aa9c, checked in by Frederik Heber <heber@…>, 18 years ago
MinimisePerturbed(): verbosity changed, some comments
Property mode set to `100644`
File size: 208.8 KB

Line
1	/** \file perturbed.c
2	* Perturbation calculation due to external magnetic field.
3	*
4	* Central function is MinimisePerturbed() wherein the actual minimisation of the two different operators with each
5	* three components takes place subsequently. Helpful routines are CalculatePerturbationOperator_P() - which applies a
6	* specified component of p on the current wave function - and CalculatePerturbationOperator_RxP() - which does the
7	* same for the RxP operator.
8	* The actual minimisation loop FindPerturbedMinimum() depends on the same routines also used for the occupied orbitals,
9	* however with a different energy functional and derivatives, evaluated in Calculate1stPerturbedDerivative() and
10	* Calculate2ndPerturbedDerivative(). InitPerturbedEnergyCalculation() calculates the total energy functional
11	* perturbed in second order for all wave functions, UpdatePerturbedEnergyCalculation() just updates the one
12	* for the wave function after it has been minimised during the line search. Both use CalculatePerturbedEnergy() which
13	* evaluates the energy functional (and the gradient if specified).
14	* Finally, FillCurrentDensity() evaluates the current density at a given point in space using the perturbed
15	* wave functions. Afterwards by calling CalculateMagneticSusceptibility() or
16	* CalculateChemicalShieldingByReciprocalCurrentDensity() susceptibility respectively shielding tensor are possible uses
17	* of this current density.
18	*
19	* There are also some test routines: TestCurrent() checks whether the integrated current is zero in each component.
20	* test_fft_symmetry() tests the "pulling out imaginary unit" before fourier transformation on a given wave function.
21	* CheckOrbitalOverlap() outputs the overlap matrix for the wave functions of a given minimisation state, this might
22	* be important for the additional \f$\Delta J{ij}\f$ contribution to the current density, which is non-zero for
23	* non-zero mutual overlap, which is evaluated if FillDeltaCurrentDensity() is called.
24	*
25	* Finally, there are also some smaller routines: truedist() gives the correct relative distance between two points
26	* in the unit cell under periodic boundary conditions with minimum image convention. ApplyTotalHamiltonian() returns
27	* the hamiltonian applied to a given wave function. sawtooth() is a sawtooth implementation which is needed in order
28	* to avoid flipping of position eigenvalues for nodes close to or on the cell boundary. CalculateOverlap()
29	* is used in the energy functional derivatives, keeping an overlap table between perturbed wave functions up to date.
30	* fft_Psi() is very similar to CalculateOneDensityR(), it does the extension of the wave function to the upper level
31	* RunStruct#Lev0 while fouriertransforming it to real space. cross() gives correct indices in evaluating a vector cross
32	* product. AllocCurrentDensity() and DisAllocCurrentDensity() mark the current density arrays as currently being in use or not.
33	*
34	Project: ParallelCarParrinello
35	\author Frederik Heber
36	\date 2006
37
38	*/
39
40	#include <stdlib.h>
41	#include <stdio.h>
42	#include <math.h>
43	#include <string.h>
44	#include <time.h>
45	#include <gsl/gsl_matrix.h>
46	#include <gsl/gsl_eigen.h>
47	#include <gsl/gsl_complex.h>
48	#include <gsl/gsl_complex_math.h>
49	#include <gsl/gsl_sort_vector.h>
50	#include <gsl/gsl_linalg.h>
51	#include <gsl/gsl_multimin.h>
52
53	#include "data.h"
54	#include "density.h"
55	#include "energy.h"
56	#include "excor.h"
57	#include "errors.h"
58	#include "grad.h"
59	#include "gramsch.h"
60	#include "mergesort2.h"
61	#include "helpers.h"
62	#include "init.h"
63	#include "myfft.h"
64	#include "mymath.h"
65	#include "output.h"
66	#include "pcp.h"
67	#include "perturbed.h"
68	#include "run.h"
69	#include "wannier.h"
70
71
72	/** Minimisation of the PsiTypeTag#Perturbed_RxP0, PsiTypeTag#Perturbed_P0 and other orbitals.
73	* For each of the above PsiTypeTag we go through the following before the minimisation loop:
74	* -# ResetGramSchTagType() resets current type that is to be minimised to NotOrthogonal.
75	* -# UpdateActualPsiNo() steps on to next perturbed of current PsiTypeTag type.
76	* -# GramSch() orthonormalizes perturbed wave functions.
77	* -# TestGramSch() tests if orthonormality was achieved.
78	* -# InitDensityCalculation() gathers densities from all wave functions (and all processes), within SpeedMeasure() DensityTime.
79	* -# InitPerturbedEnergyCalculation() performs initial calculation of the perturbed energy functional.
80	* -# RunStruct#OldActualLocalPsiNo is set to RunStruct#ActualLocalPsiNo, immediately followed by UpdateGramSchOldActualPsiNo()
81	* to bring info on all processes on par.
82	* -# UpdatePerturbedEnergyCalculation() re-calculates Gradient and GradientTypes#H1cGradient for RunStruct#ActualLocalPsiNo
83	* -# EnergyAllReduce() gathers various energy terms and sums up into Energy#TotalEnergy.
84	*
85	* And during the minimisation loop:
86	* -# FindPerturbedMinimum() performs the gradient conjugation, the line search and wave function update.
87	* -# UpdateActualPsiNo() steps on to the next wave function, orthonormalizing by GramSch() if necessary.
88	* -# UpdateEnergyArray() shifts TotalEnergy values to make space for new one.
89	* -# There is no density update as the energy function does not depend on the changing perturbed density but only on the fixed
90	* unperturbed one.
91	* -# UpdatePerturbedEnergyCalculation() re-calculates the perturbed energy of the changed wave function.
92	* -# EnergyAllReduce() gathers energy terms and sums up.
93	* -# CheckCPULIM() checks if external Stop signal has been given.
94	* -# CalculateMinimumStop() checks whether we have dropped below a certain minimum change during minimisation of total energy.
95	* -# finally step counters LatticeLevel#Step and SpeedStruct#Steps are increased.
96	*
97	* After the minimisation loop:
98	* -# SetGramSchExtraPsi() removes extra Psis from orthogonaliy check.
99	* -# ResetGramSchTagType() sets GramSchToDoType to NotUsedtoOrtho.
100	*
101	* And after all minimisation runs are done:
102	* -# UpdateActualPsiNo() steps back to PsiTypeTag#Occupied type.
103	*
104	* At the end we return to Occupied wave functions.
105	* \param *P at hand
106	* \param *Stop flag to determine if epsilon stop conditions have met
107	* \param *SuperStop flag to determinte whether external signal's required end of calculations
108	*/
109	void MinimisePerturbed (struct Problem P, int Stop, int *SuperStop) {
110	struct RunStruct *R = &P->R;
111	struct Lattice *Lat = &P->Lat;
112	struct Psis *Psi = &Lat->Psi;
113	int type;
114
115	for (type=Perturbed_P0;type<=Perturbed_RxP2;type++) { // go through each perturbation group separately //
116	*Stop=0; // reset stop flag
117	if(P->Call.out[LeaderOut]) fprintf(stderr,"(%i)Beginning perturbed minimisation of type %s ...\n", P->Par.me, R->MinimisationName[type]);
118	//OutputOrbitalPositions(P, Occupied);
119	R->PsiStep = R->MaxPsiStep; // reset in-Psi-minimisation-counter, so that we really advance to the next wave function
120	UpdateActualPsiNo(P, type); // step on to next perturbed one
121	if(P->Call.out[MinOut]) fprintf(stderr, "(%i) Re-initializing perturbed psi array for type %s ", P->Par.me, R->MinimisationName[type]);
122	if (P->Call.ReadSrcFiles && ReadSrcPsiDensity(P,type,1, R->LevSNo)) {
123	SpeedMeasure(P, InitSimTime, StartTimeDo);
124	if(P->Call.out[MinOut]) fprintf(stderr,"from source file of recent calculation\n");
125	ReadSrcPsiDensity(P,type, 0, R->LevSNo);
126	ResetGramSchTagType(P, Psi, type, IsOrthogonal); // loaded values are orthonormal
127	SpeedMeasure(P, DensityTime, StartTimeDo);
128	//InitDensityCalculation(P);
129	SpeedMeasure(P, DensityTime, StopTimeDo);
130	R->OldActualLocalPsiNo = R->ActualLocalPsiNo; // needed otherwise called routines in function below crash
131	UpdateGramSchOldActualPsiNo(P,Psi);
132	InitPerturbedEnergyCalculation(P, 1); // go through all orbitals calculate each H^{(0)}-eigenvalue, recalc HGDensity, cause InitDensityCalc zero'd it
133	UpdatePerturbedEnergyCalculation(P); // H1cGradient and Gradient must be current ones
134	EnergyAllReduce(P); // gather energies for minimum search
135	SpeedMeasure(P, InitSimTime, StopTimeDo);
136	}
137	if (P->Call.ReadSrcFiles != 1) {
138	SpeedMeasure(P, InitSimTime, StartTimeDo);
139	ResetGramSchTagType(P, Psi, type, NotOrthogonal); // perturbed now shall be orthonormalized
140	if (P->Call.ReadSrcFiles != 2) {
141	if (R->LevSNo == Lat->MaxLevel-1) { // is it the starting level? (see InitRunLevel())
142	if(P->Call.out[MinOut]) fprintf(stderr, "randomly.\n");
143	InitPsisValue(P, Psi->TypeStartIndex[type], Psi->TypeStartIndex[type+1]); // initialize perturbed array for this run
144	} else {
145	if(P->Call.out[MinOut]) fprintf(stderr, "from source file of last level.\n");
146	ReadSrcPerturbedPsis(P, type);
147	}
148	}
149	SpeedMeasure(P, InitGramSchTime, StartTimeDo);
150	GramSch(P, R->LevS, Psi, Orthogonalize);
151	SpeedMeasure(P, InitGramSchTime, StopTimeDo);
152	SpeedMeasure(P, InitDensityTime, StartTimeDo);
153	//InitDensityCalculation(P);
154	SpeedMeasure(P, InitDensityTime, StopTimeDo);
155	InitPerturbedEnergyCalculation(P, 1); // go through all orbitals calculate each H^{(0)}-eigenvalue, recalc HGDensity, cause InitDensityCalc zero'd it
156	R->OldActualLocalPsiNo = R->ActualLocalPsiNo; // needed otherwise called routines in function below crash
157	UpdateGramSchOldActualPsiNo(P,Psi);
158	UpdatePerturbedEnergyCalculation(P); // H1cGradient and Gradient must be current ones
159	EnergyAllReduce(P); // gather energies for minimum search
160	SpeedMeasure(P, InitSimTime, StopTimeDo);
161	R->LevS->Step++;
162	EnergyOutput(P,0);
163	while (*Stop != 1) {
164	//debug(P,"FindPerturbedMinimum");
165	FindPerturbedMinimum(P); // find minimum
166	//debug(P,"UpdateActualPsiNo");
167	UpdateActualPsiNo(P, type); // step on to next perturbed Psi
168	//debug(P,"UpdateEnergyArray");
169	UpdateEnergyArray(P); // shift energy values in their array by one
170	//debug(P,"UpdatePerturbedEnergyCalculation");
171	UpdatePerturbedEnergyCalculation(P); // re-calc energies (which is hopefully lower)
172	EnergyAllReduce(P); // gather from all processes and sum up to total energy
173	//ControlNativeDensity(P); // check total density (summed up PertMixed must be zero!)
174	//printf ("(%i,%i,%i)S(%i,%i,%i):\t %5d %10.5f\n",P->Par.my_color_comm_ST,P->Par.me_comm_ST, P->Par.me_comm_ST_PsiT, R->MinStep, R->ActualLocalPsiNo, R->PsiStep, (int)iter, s_multi->f);
175	if (*SuperStop != 1)
176	*SuperStop = CheckCPULIM(P);
177	Stop = CalculateMinimumStop(P, SuperStop);
178	P->Speed.Steps++; // step on
179	R->LevS->Step++;
180	}
181	// now release normalization condition and minimize wrt to norm
182	if(P->Call.out[MinOut]) fprintf(stderr,"(%i) Writing %s srcpsi to disk\n", P->Par.me, R->MinimisationName[type]);
183	OutputSrcPsiDensity(P, type);
184	// if (!TestReadnWriteSrcDensity(P,type))
185	// Error(SomeError,"TestReadnWriteSrcDensity failed!");
186	}
187
188	TestGramSch(P,R->LevS,Psi, type); // functions are orthonormal?
189	// calculate current density summands
190	//if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Filling current density grid ...\n",P->Par.me);
191	SpeedMeasure(P, CurrDensTime, StartTimeDo);
192	if (*SuperStop != 1) {
193	if ((R->DoFullCurrent == 1) \|\| ((R->DoFullCurrent == 2) && (CheckOrbitalOverlap(P) == 1))) { //test to check whether orbitals have mutual overlap and thus \\DeltaJ_{xc} must not be dropped
194	R->DoFullCurrent = 1; // set to 1 if it was 2 but Check...() yielded necessity
195	//debug(P,"Filling with Delta j ...");
196	//FillDeltaCurrentDensity(P);
197	}// else
198	//debug(P,"There is no overlap between orbitals.");
199	//debug(P,"Filling with j ...");
200	FillCurrentDensity(P);
201	}
202	SpeedMeasure(P, CurrDensTime, StopTimeDo);
203
204	SetGramSchExtraPsi(P,Psi,NotUsedToOrtho); // remove extra Psis from orthogonality check
205	ResetGramSchTagType(P, Psi, type, NotUsedToOrtho); // remove this group from the check for the next minimisation group as well!
206	}
207	UpdateActualPsiNo(P, Occupied); // step on back to an occupied one
208	}
209
210	/** Tests overlap matrix between each pair of orbitals for non-diagonal form.
211	* We simply check whether the overlap matrix Psis#lambda has off-diagonal entries greater MYEPSILON or not.
212	* \param *P Problem at hand
213	* \note The routine is meant as atest criteria if \f$\Delta J_[ij]\f$ contribution is necessary, as it is only non-zero if
214	* there is mutual overlap between the two orbitals.
215	*/
216	int CheckOrbitalOverlap(struct Problem *P)
217	{
218	struct Lattice *Lat = &P->Lat;
219	struct Psis *Psi = &Lat->Psi;
220	int i,j;
221	int counter = 0;
222
223	// output matrix
224	if (P->Par.me == 0) fprintf(stderr, "(%i) S_ij =\n", P->Par.me);
225	for (i=0;i<Psi->NoOfPsis;i++) {
226	for (j=0;j<Psi->NoOfPsis;j++) {
227	if (fabs(Psi->lambda[i][j]) > MYEPSILON) counter++;
228	if (P->Par.me == 0) fprintf(stderr, "%e\t", Psi->lambda[i][j]); //Overlap[i][j]
229	}
230	if (P->Par.me == 0) fprintf(stderr, "\n");
231	}
232
233	fprintf(stderr, "(%i) CheckOverlap: %i overlaps found.\t", P->Par.me, counter);
234	if (counter > 0) return (1);
235	else return(0);
236	}
237
238	/** Initialization of perturbed energy.
239	* For each local wave function of the current minimisation type RunStruct#CurrentMin it is called:
240	* - CalculateNonLocalEnergyNoRT(): for the coefficient-dependent form factors
241	* - CalculatePerturbedEnergy(): for the perturbed energy, yet without gradient calculation
242	* - CalculateOverlap(): for the overlap between the perturbed wave functions of the current RunStruct#CurrentMin state.
243	*
244	* Afterwards for the two types AllPsiEnergyTypes#Perturbed1_0Energy and AllPsiEnergyTypes#Perturbed0_1Energy the
245	* energy contribution from each wave function is added up in Energy#AllLocalPsiEnergy.
246	* \param *P Problem at hand
247	* \param first state whether it is the first (1) or successive call (0), which avoids some initial calculations.
248	* \sa UpdatePerturbedEnergy()
249	* \note Afterwards EnergyAllReduce() must be called.
250	*/
251	void InitPerturbedEnergyCalculation(struct Problem *P, const int first)
252	{
253	struct Lattice *Lat = &(P->Lat);
254	int p,i;
255	const enum PsiTypeTag state = P->R.CurrentMin;
256	for (p=Lat->Psi.TypeStartIndex[state]; p < Lat->Psi.TypeStartIndex[state+1]; p++) {
257	//if (p < 0 \|\| p >= Lat->Psi.LocalNo) Error(SomeError,"InitPerturbedEnergyCalculation: p out of range");
258	CalculateNonLocalEnergyNoRT(P, p); // recalculating non-local form factors which are coefficient dependent!
259	CalculatePsiEnergy(P,p,1);
260	CalculatePerturbedEnergy(P, p, 0, first);
261	CalculateOverlap(P, p, state);
262	}
263	for (i=0; i<= Perturbed0_1Energy; i++) {
264	Lat->E->AllLocalPsiEnergy[i] = 0.0;
265	for (p=0; p < Lat->Psi.LocalNo; p++)
266	if (P->Lat.Psi.LocalPsiStatus[p].PsiType == state)
267	Lat->E->AllLocalPsiEnergy[i] += Lat->E->PsiEnergy[i][p];
268	}
269	}
270
271
272	/** Updating of perturbed energy.
273	* For current and former (if not the same) local wave function RunStruct#ActualLocal, RunStruct#OldActualLocalPsiNo it is called:
274	* - CalculateNonLocalEnergyNoRT(): for the form factors
275	* - CalculatePerturbedEnergy(): for the perturbed energy, gradient only for RunStruct#ActualLocal
276	* - CalculatePerturbedOverlap(): for the overlap between the perturbed wave functions
277	*
278	* Afterwards for the two types AllPsiEnergyTypes#Perturbed1_0Energy and AllPsiEnergyTypes#Perturbed0_1Energy the
279	* energy contribution from each wave function is added up in Energy#AllLocalPsiEnergy.
280	* \param *P Problem at hand
281	* \sa CalculatePerturbedEnergy() called from here.
282	* \note Afterwards EnergyAllReduce() must be called.
283	*/
284	void UpdatePerturbedEnergyCalculation(struct Problem *P)
285	{
286	struct Lattice *Lat = &(P->Lat);
287	struct Psis *Psi = &Lat->Psi;
288	struct RunStruct *R = &P->R;
289	const enum PsiTypeTag state = R->CurrentMin;
290	int p = R->ActualLocalPsiNo;
291	const int p_old = R->OldActualLocalPsiNo;
292	int i;
293
294	if (p != p_old) {
295	//if (p_old < 0 \|\| p_old >= Lat->Psi.LocalNo) Error(SomeError,"UpdatePerturbedEnergyCalculation: p_old out of range");
296	CalculateNonLocalEnergyNoRT(P, p_old);
297	CalculatePsiEnergy(P,p_old,0);
298	CalculatePerturbedEnergy(P, p_old, 0, 0);
299	CalculateOverlap(P, p_old, state);
300	}
301	//if (p < 0 \|\| p >= Lat->Psi.LocalNo) Error(SomeError,"InitPerturbedEnergyCalculation: p out of range");
302	// recalculating non-local form factors which are coefficient dependent!
303	CalculateNonLocalEnergyNoRT(P,p);
304	CalculatePsiEnergy(P,p,0);
305	CalculatePerturbedEnergy(P, p, 1, 0);
306	CalculateOverlap(P, p, state);
307
308	for (i=0; i<= Perturbed0_1Energy; i++) {
309	Lat->E->AllLocalPsiEnergy[i] = 0.0;
310	for (p=0; p < Psi->LocalNo; p++)
311	if (Psi->LocalPsiStatus[p].PsiType == state)
312	Lat->E->AllLocalPsiEnergy[i] += Lat->E->PsiEnergy[i][p];
313	}
314	}
315
316	/** Calculates gradient and evaluates second order perturbed energy functional for specific wave function.
317	* The in second order perturbed energy functional reads as follows.
318	* \f[
319	* E^{(2)} = \sum_{kl} \langle \varphi_k^{(1)} \| H^{(0)} \delta_{kl} - \lambda_{kl} \| \varphi_l^{(1)} \rangle
320	* + \underbrace{\langle \varphi_l^{(0)} \| H^{(1)} \| \varphi_l^{(1)} \rangle + \langle \varphi_l^{(1)} \| H^{(1)} \| \varphi_l^{(0)} \rangle}_{2 {\cal R} \langle \varphi_l^{(1)} \| H^{(1)} \| \varphi_l^{(0)} \rangle}
321	* \f]
322	* And the gradient
323	* \f[
324	* \widetilde{\varphi}_k^{(1)} = - \sum_l ({\cal H}^{(0)} \delta_{kl} - \lambda_{kl} \| \varphi_l^{(1)} \rangle + {\cal H}^{(1)} \| \varphi_k^{(0)} \rangle
325	* \f]
326	* First, the HGDensity is recalculated if \a first says so - see ApplyTotalHamiltonian().
327	*
328	* Next, we need the perturbation hamiltonian acting on both the respective occupied and current wave function,
329	* see perturbed.c for respective function calls.
330	*
331	* Finally, the scalar product between the wave function and Hc_Gradient yields the eigenvalue of the hamiltonian,
332	* which is summed up over all reciprocal grid vectors and stored in OnePsiElementAddData#Lambda. The Gradient is
333	* the inverse of Hc_Gradient and with the following summation over all perturbed wave functions (MPI exchange of
334	* non-local coefficients) the gradient is computed. Here we need Psis#lambda, which is computed in CalculateHamiltonian().
335	*
336	* Also \f${\cal H}^{(1)} \| \varphi_l^{(0)} \rangle\f$ is stored in GradientTypes#H1cGradient.
337	* \param *P Problem at hand, contains RunStruct, Lattice, LatticeLevel RunStruct#LevS
338	* \param l offset of perturbed wave function within Psi#LocalPsiStatus (\f$\varphi_l^{(1)}\f$)
339	* \param DoGradient (1 = yes, 0 = no) whether gradient shall be calculated or not
340	* \param first recaculate HGDensity (1) or not (0)
341	* \note DensityTypes#ActualPsiDensity must be recent for gradient calculation!
342	* \sa CalculateGradientNoRT() - same procedure for evaluation of \f${\cal H}^{(0)}\| \varphi_l^{(1)} \rangle\f$
343	* \note without the simplification of \f$2 {\cal R} \langle \varphi_l^{(1)} \| H^{(1)} \| \varphi_l^{(0)} \rangle\f$ the
344	* calculation would be impossible due to non-local nature of perturbed wave functions. The position operator would
345	* be impossible to apply in a sensible manner.
346	*/
347	void CalculatePerturbedEnergy(struct Problem *P, const int l, const int DoGradient, const int first)
348	{
349	struct Lattice *Lat = &P->Lat;
350	struct Psis *Psi = &Lat->Psi;
351	struct Energy *E = Lat->E;
352	struct PseudoPot *PP = &P->PP;
353	struct RunStruct *R = &P->R;
354	struct LatticeLevel *LevS = R->LevS;
355	const int state = R->CurrentMin;
356	const int l_normal = Psi->TypeStartIndex[Occupied] + (l - Psi->TypeStartIndex[state]); // offset l to \varphi_l^{(0)}
357	const int ActNum = l - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[1] * Psi->LocalPsiStatus[l].my_color_comm_ST_Psi;
358	int g, i, m, j;
359	double lambda, Lambda;
360	double RElambda10, RELambda10;
361	const fftw_complex *source = LevS->LPsi->LocalPsi[l];
362	fftw_complex *grad = P->Grad.GradientArray[ActualGradient];
363	fftw_complex *Hc_grad = P->Grad.GradientArray[HcGradient];
364	fftw_complex *H1c_grad = P->Grad.GradientArray[H1cGradient];
365	fftw_complex *TempPsi_0 = H1c_grad;
366	fftw_complex varphi_1, varphi_0;
367	struct OnePsiElement OnePsiB, LOnePsiB;
368	fftw_complex *LPsiDatB=NULL;
369	const int ElementSize = (sizeof(fftw_complex) / sizeof(double));
370	int RecvSource;
371	MPI_Status status;
372
373	// ============ Calculate H^(0) psi^(1) =============================
374	//if (Hc_grad != P->Grad.GradientArray[HcGradient]) Error(SomeError,"CalculatePerturbedEnergy: Hc_grad corrupted");
375	SetArrayToDouble0((double )Hc_grad,2R->InitLevS->MaxG);
376	ApplyTotalHamiltonian(P,source,Hc_grad, PP->fnl[l], 1, first);
377
378	// ============ ENERGY FUNCTIONAL Evaluation PART 1 ================
379	//if (l_normal < 0 \|\| l_normal >= Psi->LocalNo) Error(SomeError,"CalculatePerturbedEnergy: l_normal out of range");
380	varphi_0 = LevS->LPsi->LocalPsi[l_normal];
381	//if (l < 0 \|\| l >= Psi->LocalNo) Error(SomeError,"CalculatePerturbedEnergy: l out of range");
382	varphi_1 = LevS->LPsi->LocalPsi[l];
383	//if (TempPsi_0 != P->Grad.GradientArray[H1cGradient]) Error(SomeError,"CalculatePerturbedEnergy: TempPsi_0 corrupted");
384	SetArrayToDouble0((double )TempPsi_0,2R->InitLevS->MaxG);
385	switch (state) {
386	case Perturbed_P0:
387	CalculatePerturbationOperator_P(P,varphi_0,TempPsi_0,0); // \nabla_0 \| \varphi_l^{(0)} \rangle
388	break;
389	case Perturbed_P1:
390	CalculatePerturbationOperator_P(P,varphi_0,TempPsi_0,1); // \nabla_1 \| \varphi_l^{(0)} \rangle
391	break;
392	case Perturbed_P2:
393	CalculatePerturbationOperator_P(P,varphi_0,TempPsi_0,2); // \nabla_1 \| \varphi_l^{(0)} \rangle
394	break;
395	case Perturbed_RxP0:
396	CalculatePerturbationOperator_RxP(P,varphi_0,TempPsi_0,l_normal,0); // r \times \nabla \| \varphi_l^{(0)} \rangle
397	break;
398	case Perturbed_RxP1:
399	CalculatePerturbationOperator_RxP(P,varphi_0,TempPsi_0,l_normal,1); // r \times \nabla \| \varphi_l^{(0)} \rangle
400	break;
401	case Perturbed_RxP2:
402	CalculatePerturbationOperator_RxP(P,varphi_0,TempPsi_0,l_normal,2); // r \times \nabla \| \varphi_l^{(0)} \rangle
403	break;
404	default:
405	fprintf(stderr,"(%i) CalculatePerturbedEnergy called whilst not within perturbation run: CurrentMin = %i !\n",P->Par.me, R->CurrentMin);
406	break;
407	}
408
409	// ============ GRADIENT and EIGENVALUE Evaluation Part 1==============
410	lambda = 0.0;
411	if ((DoGradient) && (grad != NULL)) {
412	g = 0;
413	if (LevS->GArray[0].GSq == 0.0) {
414	lambda += Hc_grad[0].re*source[0].re;
415	//if (grad != P->Grad.GradientArray[ActualGradient]) Error(SomeError,"CalculatePerturbedEnergy: grad corrupted");
416	grad[0].re = -(Hc_grad[0].re + TempPsi_0[0].re);
417	grad[0].im = -(Hc_grad[0].im + TempPsi_0[0].im);
418	g++;
419	}
420	for (;g<LevS->MaxG;g++) {
421	lambda += 2.(Hc_grad[g].resource[g].re + Hc_grad[g].im*source[g].im);
422	//if (grad != P->Grad.GradientArray[ActualGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"CalculatePerturbedEnergy: grad corrupted");
423	grad[g].re = -(Hc_grad[g].re + TempPsi_0[g].re);
424	grad[g].im = -(Hc_grad[g].im + TempPsi_0[g].im);
425	}
426
427	m = -1;
428	for (j=0; j < Psi->MaxPsiOfType+P->Par.Max_me_comm_ST_PsiT; j++) { // go through all wave functions
429	OnePsiB = &Psi->AllPsiStatus[j]; // grab OnePsiB
430	if (OnePsiB->PsiType == state) { // drop all but the ones of current min state
431	m++; // increase m if it is type-specific wave function
432	if (OnePsiB->my_color_comm_ST_Psi == P->Par.my_color_comm_ST_Psi) // local?
433	LOnePsiB = &Psi->LocalPsiStatus[OnePsiB->MyLocalNo];
434	else
435	LOnePsiB = NULL;
436	if (LOnePsiB == NULL) { // if it's not local ... receive it from respective process into TempPsi
437	RecvSource = OnePsiB->my_color_comm_ST_Psi;
438	MPI_Recv( LevS->LPsi->TempPsi, LevS->MaxG*ElementSize, MPI_DOUBLE, RecvSource, PerturbedTag, P->Par.comm_ST_PsiT, &status );
439	LPsiDatB=LevS->LPsi->TempPsi;
440	} else { // .. otherwise send it to all other processes (Max_me... - 1)
441	for (i=0;i<P->Par.Max_me_comm_ST_PsiT;i++)
442	if (i != OnePsiB->my_color_comm_ST_Psi)
443	MPI_Send( LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo], LevS->MaxG*ElementSize, MPI_DOUBLE, i, PerturbedTag, P->Par.comm_ST_PsiT);
444	LPsiDatB=LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo];
445	} // LPsiDatB is now set to the coefficients of OnePsi either stored or MPI_Received
446
447	g = 0;
448	if (LevS->GArray[0].GSq == 0.0) { // perform the summation
449	//if (grad != P->Grad.GradientArray[ActualGradient]) Error(SomeError,"CalculatePerturbedEnergy: grad corrupted");
450	grad[0].re += Lat->Psi.lambda[ActNum][m]*LPsiDatB[0].re;
451	grad[0].im += Lat->Psi.lambda[ActNum][m]*LPsiDatB[0].im;
452	g++;
453	}
454	for (;g<LevS->MaxG;g++) {
455	//if (grad != P->Grad.GradientArray[ActualGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"CalculatePerturbedEnergy: grad corrupted");
456	grad[g].re += Lat->Psi.lambda[ActNum][m]*LPsiDatB[g].re;
457	grad[g].im += Lat->Psi.lambda[ActNum][m]*LPsiDatB[g].im;
458	}
459	}
460	}
461	} else {
462	lambda = GradSP(P,LevS,Hc_grad,source);
463	}
464	MPI_Allreduce ( &lambda, &Lambda, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
465	//fprintf(stderr,"(%i) Lambda[%i] = %lg\n",P->Par.me, l, Lambda);
466	//if (l < 0 \|\| l >= Psi->LocalNo) Error(SomeError,"CalculatePerturbedEnergy: l out of range");
467	Lat->Psi.AddData[l].Lambda = Lambda;
468
469	// ============ ENERGY FUNCTIONAL Evaluation PART 2 ================
470	// varphi_1 jas negative symmetry, returning TempPsi_0 from CalculatePerturbedOperator also, thus real part of scalar product
471	// "-" due to purely imaginary wave function is on left hand side, thus becomes complex conjugated: i -> -i
472	// (-i goes into pert. op., "-" remains when on right hand side)
473	RElambda10 = GradSP(P,LevS,varphi_1,TempPsi_0) * sqrt(Psi->LocalPsiStatus[l].PsiFactor * Psi->LocalPsiStatus[l_normal].PsiFactor);
474	//RElambda01 = -GradSP(P,LevS,varphi_0,TempPsi_1) * sqrt(Psi->LocalPsiStatus[l].PsiFactor * Psi->LocalPsiStatus[l_normal].PsiFactor);
475
476	MPI_Allreduce ( &RElambda10, &RELambda10, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
477	//MPI_Allreduce ( &RElambda01, &RELambda01, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
478
479	//if (l < 0 \|\| l >= Psi->LocalNo) Error(SomeError,"CalculatePerturbedEnergy: l out of range");
480	E->PsiEnergy[Perturbed1_0Energy][l] = RELambda10;
481	E->PsiEnergy[Perturbed0_1Energy][l] = RELambda10;
482	// if (P->Par.me == 0) {
483	// fprintf(stderr,"RE.Lambda10[%i-%i] = %lg\t RE.Lambda01[%i-%i] = %lg\n", l, l_normal, RELambda10, l_normal, l, RELambda01);
484	// }
485	// GradImSP() is only applicable to a product of wave functions with uneven symmetry!
486	// Otherwise, due to the nature of symmetry, a sum over only half of the coefficients will in most cases not result in zero!
487	}
488
489	/** Applies \f$H^{(0)}\f$ to a given \a source.
490	* The DensityTypes#HGDensity is computed, the exchange potential added and the
491	* whole multiplied - coefficient by coefficient - with the current wave function, taken from its density coefficients,
492	* on the upper LatticeLevel (RunStruct#Lev0), which (DensityTypes#ActualPsiDensity) is updated beforehand.
493	* After an inverse fft (now G-dependent) the non-local potential is added and
494	* within the reciprocal basis set, the kinetic energy can be evaluated easily.
495	* \param *P Problem at hand
496	* \param *source pointer to source coefficient array, \f$\| \varphi(G) \rangle\f$
497	* \param *dest pointer to dest coefficient array,\f$H^{(0)} \| \varphi(G) \rangle\f$
498	* \param **fnl pointer to non-local form factor array
499	* \param PsiFactor occupation number of orbital
500	* \param first 1 - Re-calculate DensityTypes#HGDensity, 0 - don't
501	* \sa CalculateConDirHConDir() - same procedure
502	*/
503	void ApplyTotalHamiltonian(struct Problem P, const fftw_complex source, fftw_complex dest, fftw_complex **fnl, const double PsiFactor, const int first) {
504	struct Lattice *Lat = &P->Lat;
505	struct RunStruct *R = &P->R;
506	struct LatticeLevel *LevS = R->LevS;
507	struct LatticeLevel *Lev0 = R->Lev0;
508	struct Density *Dens0 = Lev0->Dens;
509	struct fft_plan_3d *plan = Lat->plan;
510	struct PseudoPot *PP = &P->PP;
511	struct Ions *I = &P->Ion;
512	fftw_complex *work = Dens0->DensityCArray[TempDensity];
513	fftw_real *HGcR = Dens0->DensityArray[HGcDensity];
514	fftw_complex HGcRC = (fftw_complex)HGcR;
515	fftw_complex *HGC = Dens0->DensityCArray[HGDensity];
516	fftw_real HGCR = (fftw_real )HGC;
517	fftw_complex *PsiC = Dens0->DensityCArray[ActualPsiDensity];
518	fftw_real PsiCR = (fftw_real )PsiC;
519	//const fftw_complex *dest_bak = dest;
520	int nx,ny,nz,iS,i0;
521	const int Nx = LevS->Plan0.plan->local_nx;
522	const int Ny = LevS->Plan0.plan->N[1];
523	const int Nz = LevS->Plan0.plan->N[2];
524	const int NUpx = LevS->NUp[0];
525	const int NUpy = LevS->NUp[1];
526	const int NUpz = LevS->NUp[2];
527	const double HGcRCFactor = 1./LevS->MaxN;
528	int g, Index, i, it;
529	fftw_complex vp,rp,rhog,TotalPsiDensity;
530	double Fac;
531
532	if (first) {
533	// recalculate HGDensity
534	//if (HGC != Dens0->DensityCArray[HGDensity]) Error(SomeError,"ApplyTotalHamiltonian: HGC corrupted");
535	SetArrayToDouble0((double )HGC,2Dens0->TotalSize);
536	g=0;
537	if (Lev0->GArray[0].GSq == 0.0) {
538	Index = Lev0->GArray[0].Index;
539	c_re(vp) = 0.0;
540	c_im(vp) = 0.0;
541	for (it = 0; it < I->Max_Types; it++) {
542	c_re(vp) += (c_re(I->I[it].SFactor[0])*PP->phi_ps_loc[it][0]);
543	c_im(vp) += (c_im(I->I[it].SFactor[0])*PP->phi_ps_loc[it][0]);
544	}
545	//if (HGC != Dens0->DensityCArray[HGDensity] \|\| Index<0 \|\| Index>=Dens0->LocalSizeC) Error(SomeError,"ApplyTotalHamiltonian: HGC corrupted");
546	c_re(HGC[Index]) = c_re(vp);
547	c_re(TotalPsiDensity) = c_re(Dens0->DensityCArray[TotalDensity][Index]);
548	c_im(TotalPsiDensity) = c_im(Dens0->DensityCArray[TotalDensity][Index]);
549
550	g++;
551	}
552	for (; g < Lev0->MaxG; g++) {
553	Index = Lev0->GArray[g].Index;
554	Fac = 4.*PI/(Lev0->GArray[g].GSq);
555	c_re(vp) = 0.0;
556	c_im(vp) = 0.0;
557	c_re(rp) = 0.0;
558	c_im(rp) = 0.0;
559	for (it = 0; it < I->Max_Types; it++) {
560	c_re(vp) += (c_re(I->I[it].SFactor[g])*PP->phi_ps_loc[it][g]);
561	c_im(vp) += (c_im(I->I[it].SFactor[g])*PP->phi_ps_loc[it][g]);
562	c_re(rp) += (c_re(I->I[it].SFactor[g])*PP->FacGauss[it][g]);
563	c_im(rp) += (c_im(I->I[it].SFactor[g])*PP->FacGauss[it][g]);
564	} // rp = n^{Gauss)(G)
565
566	// n^{tot} = n^0 + \lambda n^1 + ...
567	//if (isnan(c_re(Dens0->DensityCArray[TotalDensity][Index]))) { fprintf(stderr,"(%i) WARNING in CalculatePerturbedEnergy(): TotalDensity[%i] = NaN!\n", P->Par.me, Index); Error(SomeError, "NaN-Fehler!"); }
568	c_re(TotalPsiDensity) = c_re(Dens0->DensityCArray[TotalDensity][Index]);
569	c_im(TotalPsiDensity) = c_im(Dens0->DensityCArray[TotalDensity][Index]);
570
571	c_re(rhog) = c_re(TotalPsiDensity)*R->HGcFactor+c_re(rp);
572	c_im(rhog) = c_im(TotalPsiDensity)*R->HGcFactor+c_im(rp);
573	// rhog = n(G) + n^{Gauss}(G), rhoe = n(G)
574	//if (HGC != Dens0->DensityCArray[HGDensity] \|\| Index<0 \|\| Index>=Dens0->LocalSizeC) Error(SomeError,"ApplyTotalHamiltonian: HGC corrupted");
575	c_re(HGC[Index]) = c_re(vp)+Fac*c_re(rhog);
576	c_im(HGC[Index]) = c_im(vp)+Fac*c_im(rhog);
577	}
578	//
579	for (i=0; i<Lev0->MaxDoubleG; i++) {
580	//if (HGC != Dens0->DensityCArray[HGDensity] \|\| Lev0->DoubleG[2i+1]<0 \|\| Lev0->DoubleG[2i+1]>Dens0->LocalSizeC \|\| Lev0->DoubleG[2i]<0 \|\| Lev0->DoubleG[2i]>Dens0->LocalSizeC) Error(SomeError,"CalculatePerturbedEnergy: grad corrupted");
581	HGC[Lev0->DoubleG[2i+1]].re = HGC[Lev0->DoubleG[2i]].re;
582	HGC[Lev0->DoubleG[2i+1]].im = -HGC[Lev0->DoubleG[2i]].im;
583	}
584	}
585	// ============ GRADIENT and EIGENVALUE Evaluation Part 1==============
586	// \lambda_l^{(1)} = \langle \varphi_l^{(1)} \| H^{(0)} \| \varphi_l^{(1)} \rangle and gradient calculation
587	SpeedMeasure(P, LocTime, StartTimeDo);
588	// back-transform HGDensity: (G) -> (R)
589	//if (HGC != Dens0->DensityCArray[HGDensity]) Error(SomeError,"ApplyTotalHamiltonian: HGC corrupted");
590	if (first) fft_3d_complex_to_real(plan, Lev0->LevelNo, FFTNF1, HGC, work);
591	// evaluate exchange potential with this density, add up onto HGCR
592	//if (HGCR != (fftw_real *)Dens0->DensityCArray[HGDensity]) Error(SomeError,"ApplyTotalHamiltonian: HGCR corrupted");
593	if (first) CalculateXCPotentialNoRT(P, HGCR); // add V^{xc} on V^H + V^{ps}
594	// make sure that ActualPsiDensity is recent
595	CalculateOneDensityR(Lat, LevS, Dens0, source, Dens0->DensityArray[ActualDensity], R->FactorDensityR*PsiFactor, 1);
596	for (nx=0;nx<Nx;nx++)
597	for (ny=0;ny<Ny;ny++)
598	for (nz=0;nz<Nz;nz++) {
599	i0 = nzNUpz+NzNUpz(nyNUpy+NyNUpynx*NUpx);
600	iS = nz+Nz(ny+Nynx);
601	//if (HGcR != Dens0->DensityArray[HGcDensity] \|\| iS<0 \|\| iS>=LevS->Dens->LocalSizeR) Error(SomeError,"ApplyTotalHamiltonian: HGC corrupted");
602	HGcR[iS] = HGCR[i0]PsiCR[i0]; / Matrix Vector Mult */
603	}
604	// (R) -> (G)
605	//if (HGcRC != (fftw_complex *)Dens0->DensityArray[HGcDensity]) Error(SomeError,"ApplyTotalHamiltonian: HGcRC corrupted");
606	fft_3d_real_to_complex(plan, LevS->LevelNo, FFTNF1, HGcRC, work);
607	SpeedMeasure(P, LocTime, StopTimeDo);
608	/* NonLocalPP */
609	SpeedMeasure(P, NonLocTime, StartTimeDo);
610	//if (dest != dest_bak) Error(SomeError,"ApplyTotalHamiltonian: dest corrupted");
611	CalculateAddNLPot(P, dest, fnl, PsiFactor); // wave function hidden in form factors fnl, also resets Hc_grad beforehand
612	SpeedMeasure(P, NonLocTime, StopTimeDo);
613
614	/* create final vector */
615	for (g=0;g<LevS->MaxG;g++) {
616	Index = LevS->GArray[g].Index; /* FIXME - factoren */
617	//if (dest != dest_bak \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"ApplyTotalHamiltonian: dest corrupted");
618	dest[g].re += PsiFactor(HGcRC[Index].reHGcRCFactor + 0.5LevS->GArray[g].GSqsource[g].re);
619	dest[g].im += PsiFactor(HGcRC[Index].imHGcRCFactor + 0.5LevS->GArray[g].GSqsource[g].im);
620	}
621	}
622
623	#define stay_above 0.001 //!< value above which the coefficient of the wave function will always remain
624
625	/** Finds the minimum of perturbed energy in regards of actual wave function.
626	* The following happens step by step:
627	* -# The Gradient is copied into GradientTypes#GraSchGradient (which is nothing but a pointer to
628	* one array in LPsiDat) and orthonormalized via GramSch() to all occupied wave functions
629	* except to the current perturbed one.
630	* -# Then comes pre-conditioning, analogous to CalculatePreConGrad().
631	* -# The Gradient is projected onto the current perturbed wave function and this is subtracted, i.e.
632	* vector is the conjugate gradient.
633	* -# Finally, Calculate1stPerturbedDerivative() and Calculate2ndPerturbedDerivative() are called and
634	* with these results and the current total energy, CalculateDeltaI() finds the parameter for the one-
635	* dimensional minimisation. The current wave function is set to newly found minimum and approximated
636	* total energy is printed.
637	*
638	* \param *P Problem at hand
639	* \sa CalculateNewWave() and functions therein
640	*/
641	void FindPerturbedMinimum(struct Problem *P)
642	{
643	struct Lattice *Lat = &P->Lat;
644	struct RunStruct *R = &P->R;
645	struct Psis *Psi = &Lat->Psi;
646	struct PseudoPot *PP = &P->PP;
647	struct LatticeLevel *LevS = R->LevS;
648	struct LatticeLevel *Lev0 = R->Lev0;
649	struct Density *Dens = Lev0->Dens;
650	struct Energy *En = Lat->E;
651	struct FileData *F = &P->Files;
652	int g,p,i;
653	int step = R->PsiStep;
654	double *GammaDiv = &Lat->Psi.AddData[R->ActualLocalPsiNo].Gamma;
655	const int ElementSize = (sizeof(fftw_complex) / sizeof(double));
656	fftw_complex *source = LevS->LPsi->LocalPsi[R->ActualLocalPsiNo];
657	fftw_complex *grad = P->Grad.GradientArray[ActualGradient];
658	fftw_complex *GradOrtho = P->Grad.GradientArray[GraSchGradient];
659	fftw_complex *PCgrad = P->Grad.GradientArray[PreConGradient];
660	fftw_complex *PCOrtho = P->Grad.GradientArray[GraSchGradient];
661	fftw_complex *ConDir = P->Grad.GradientArray[ConDirGradient];
662	fftw_complex *ConDir_old = P->Grad.GradientArray[OldConDirGradient];
663	fftw_complex *Ortho = P->Grad.GradientArray[GraSchGradient];
664	const fftw_complex *Hc_grad = P->Grad.GradientArray[HcGradient];
665	const fftw_complex *H1c_grad = P->Grad.GradientArray[H1cGradient];
666	fftw_complex *HConDir = Dens->DensityCArray[ActualDensity];
667	const double PsiFactor = Lat->Psi.LocalPsiStatus[R->ActualLocalPsiNo].PsiFactor;
668	//double Lambda = Lat->Psi.AddData[R->ActualLocalPsiNo].Lambda;
669	double T;
670	double x, K; //, dK;
671	double dS[2], S[2], Gamma, GammaDivOld = *GammaDiv;
672	double LocalSP, PsiSP;
673	double dEdt0, ddEddt0, ConDirHConDir, ConDirConDir;//, sourceHsource;
674	double E0, E, delta;
675	//double E0, E, dE, ddE, delta, dcos, dsin;
676	//double EI, dEI, ddEI, deltaI, dcosI, dsinI;
677	//double HartreeddEddt0, XCddEddt0;
678	double d[4],D[4], Diff;
679	const int Num = Psi->NoOfPsis;
680
681	// ORTHOGONALIZED-GRADIENT
682	for (g=0;g<LevS->MaxG;g++) {
683	//if (GradOrtho != P->Grad.GradientArray[GraSchGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: GradOrtho corrupted");
684	GradOrtho[g].re = grad[g].re; //+Lambda*source[g].re;
685	GradOrtho[g].im = grad[g].im; //+Lambda*source[g].im;
686	}
687	// include the ExtraPsi (which is the GraSchGradient!)
688	SetGramSchExtraPsi(P, Psi, NotOrthogonal);
689	// exclude the minimised Psi
690	SetGramSchActualPsi(P, Psi, NotUsedToOrtho);
691	SpeedMeasure(P, GramSchTime, StartTimeDo);
692	// makes conjugate gradient orthogonal to all other orbits
693	//fprintf(stderr,"CalculateCGGradient: GramSch() for extra orbital\n");
694	GramSch(P, LevS, Psi, Orthogonalize);
695	SpeedMeasure(P, GramSchTime, StopTimeDo);
696	//if (grad != P->Grad.GradientArray[ActualGradient]) Error(SomeError,"FindPerturbedMinimum: grad corrupted");
697	memcpy(grad, GradOrtho, ElementSizeLevS->MaxGsizeof(double));
698	//memcpy(PCOrtho, GradOrtho, ElementSizeLevS->MaxGsizeof(double));
699
700	// PRE-CONDITION-GRADIENT
701	//if (fabs(T) < MYEPSILON) T = 1;
702	T = 0.;
703	for (i=0;i<Num;i++)
704	T += Psi->lambda[i][i];
705	for (g=0;g<LevS->MaxG;g++) {
706	x = .5*LevS->GArray[g].GSq;
707	// FIXME: Good way of accessing reciprocal Lev0 Density coefficients on LevS! (not so trivial)
708	//x += sqrt(Dens->DensityCArray[HGDensity][g].reDens->DensityCArray[HGDensity][g].re+Dens->DensityCArray[HGDensity][g].imDens->DensityCArray[HGDensity][g].im);
709	x -= T/(double)Num;
710	K = x/(xx+stay_abovestay_above);
711	//if (PCOrtho != P->Grad.GradientArray[GraSchGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: PCOrtho corrupted");
712	c_re(PCOrtho[g]) = K*c_re(grad[g]);
713	c_im(PCOrtho[g]) = K*c_im(grad[g]);
714	}
715	SetGramSchExtraPsi(P, Psi, NotOrthogonal);
716	SpeedMeasure(P, GramSchTime, StartTimeDo);
717	// preconditioned direction is orthogonalized
718	//fprintf(stderr,"CalculatePreConGrad: GramSch() for extra orbital\n");
719	GramSch(P, LevS, Psi, Orthogonalize);
720	SpeedMeasure(P, GramSchTime, StopTimeDo);
721	//if (PCgrad != P->Grad.GradientArray[PreConGradient]) Error(SomeError,"FindPerturbedMinimum: PCgrad corrupted");
722	memcpy(PCgrad, PCOrtho, ElementSizeLevS->MaxGsizeof(double));
723
724	//debug(P, "Before ConDir");
725	//fprintf(stderr,"\|(%i)\|^2 = %lg\t \|PCgrad\|^2 = %lg\t \|PCgrad,(%i)\| = %lg\n", R->ActualLocalPsiNo, GradSP(P,LevS,source,source),GradSP(P,LevS,PCgrad,PCgrad), R->ActualLocalPsiNo, GradSP(P,LevS,PCgrad,source));
726	// CONJUGATE-GRADIENT
727	LocalSP = GradSP(P, LevS, PCgrad, grad);
728	MPI_Allreduce ( &LocalSP, &PsiSP, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
729	*GammaDiv = dS[0] = PsiSP;
730	dS[1] = GammaDivOld;
731	S[0]=dS[0]; S[1]=dS[1];
732	/MPI_Allreduce ( dS, S, 2, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_PsiT);/
733	if (step) { // only in later steps is the scalar product used, but always condir stored in oldcondir and Ortho (working gradient)
734	if (fabs(S[1]) < MYEPSILON) fprintf(stderr,"CalculateConDir: S[1] = %lg\n",S[1]);
735	Gamma = S[0]/S[1];
736	if (fabs(S[1]) < MYEPSILON) {
737	if (fabs(S[0]) < MYEPSILON)
738	Gamma = 1.0;
739	else
740	Gamma = 0.0;
741	}
742	for (g=0; g < LevS->MaxG; g++) {
743	//if (ConDir != P->Grad.GradientArray[ConDirGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: ConDir corrupted");
744	c_re(ConDir[g]) = c_re(PCgrad[g]) + Gamma*c_re(ConDir_old[g]);
745	c_im(ConDir[g]) = c_im(PCgrad[g]) + Gamma*c_im(ConDir_old[g]);
746	//if (ConDir_old != P->Grad.GradientArray[OldConDirGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: ConDir_old corrupted");
747	c_re(ConDir_old[g]) = c_re(ConDir[g]);
748	c_im(ConDir_old[g]) = c_im(ConDir[g]);
749	//if (Ortho != P->Grad.GradientArray[GraSchGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: Ortho corrupted");
750	c_re(Ortho[g]) = c_re(ConDir[g]);
751	c_im(Ortho[g]) = c_im(ConDir[g]);
752	}
753	} else {
754	Gamma = 0.0;
755	for (g=0; g < LevS->MaxG; g++) {
756	//if (ConDir != P->Grad.GradientArray[ConDirGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: ConDir corrupted");
757	c_re(ConDir[g]) = c_re(PCgrad[g]);
758	c_im(ConDir[g]) = c_im(PCgrad[g]);
759	//if (ConDir_old != P->Grad.GradientArray[OldConDirGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: ConDir_old corrupted");
760	c_re(ConDir_old[g]) = c_re(ConDir[g]);
761	c_im(ConDir_old[g]) = c_im(ConDir[g]);
762	//if (Ortho != P->Grad.GradientArray[GraSchGradient] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: Ortho corrupted");
763	c_re(Ortho[g]) = c_re(ConDir[g]);
764	c_im(Ortho[g]) = c_im(ConDir[g]);
765	}
766	}
767	// orthonormalize
768	SetGramSchExtraPsi(P, Psi, NotOrthogonal);
769	SpeedMeasure(P, GramSchTime, StartTimeDo);
770	//fprintf(stderr,"CalculateConDir: GramSch() for extra orbital\n");
771	GramSch(P, LevS, Psi, Orthogonalize);
772	SpeedMeasure(P, GramSchTime, StopTimeDo);
773	//if (ConDir != P->Grad.GradientArray[ConDirGradient]) Error(SomeError,"FindPerturbedMinimum: ConDir corrupted");
774	memcpy(ConDir, Ortho, ElementSizeLevS->MaxGsizeof(double));
775	//debug(P, "Before LineSearch");
776	//fprintf(stderr,"\|(%i)\|^2 = %lg\t \|ConDir\|^2 = %lg\t \|ConDir,(%i)\| = %lg\n", R->ActualLocalPsiNo, GradSP(P,LevS,source,source),GradSP(P,LevS,ConDir,ConDir), R->ActualLocalPsiNo, GradSP(P,LevS,ConDir,source));
777	SetGramSchActualPsi(P, Psi, IsOrthogonal);
778
779	//fprintf(stderr,"(%i) Testing conjugate gradient for Orthogonality ...\n", P->Par.me);
780	//TestForOrth(P,LevS,ConDir);
781
782	// ONE-DIMENSIONAL LINE-SEARCH
783
784	// ========= dE / dt \| 0 ============
785	p = Lat->Psi.TypeStartIndex[Occupied] + (R->ActualLocalPsiNo - Lat->Psi.TypeStartIndex[R->CurrentMin]);
786	//if (Hc_grad != P->Grad.GradientArray[HcGradient]) Error(SomeError,"FindPerturbedMinimum: Hc_grad corrupted");
787	//if (H1c_grad != P->Grad.GradientArray[H1cGradient]) Error(SomeError,"FindPerturbedMinimum: H1c_grad corrupted");
788	d[0] = Calculate1stPerturbedDerivative(P, LevS->LPsi->LocalPsi[p], source, ConDir, Hc_grad, H1c_grad);
789	//CalculateConDirHConDir(P, ConDir, PsiFactor, &d[1], &d[2], &d[3]);
790	//if (ConDir != P->Grad.GradientArray[ConDirGradient]) Error(SomeError,"FindPerturbedMinimum: ConDir corrupted");
791	CalculateCDfnl(P, ConDir, PP->CDfnl); // calculate needed non-local form factors
792	//if (HConDir != Dens->DensityCArray[ActualDensity]) Error(SomeError,"FindPerturbedMinimum: HConDir corrupted");
793	SetArrayToDouble0((double )HConDir,Dens->TotalSize2);
794	//if (ConDir != P->Grad.GradientArray[ConDirGradient]) Error(SomeError,"FindPerturbedMinimum: ConDir corrupted");
795	ApplyTotalHamiltonian(P,ConDir,HConDir, PP->CDfnl, PsiFactor, 0); // applies H^(0) with total perturbed density!
796	d[1] = GradSP(P,LevS,ConDir,HConDir);
797	d[2] = GradSP(P,LevS,ConDir,ConDir);
798	d[3] = 0.;
799
800	// gather results
801	MPI_Allreduce ( &d, &D, 4, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
802	// ========== ddE / ddt \| 0 =========
803	dEdt0 = D[0];
804	for (i=MAXOLD-1; i > 0; i--)
805	En->dEdt0[i] = En->dEdt0[i-1];
806	En->dEdt0[0] = dEdt0;
807	ConDirHConDir = D[1];
808	ConDirConDir = D[2];
809	ddEddt0 = 0.0;
810	//if (ConDir != P->Grad.GradientArray[ConDirGradient]) Error(SomeError,"FindPerturbedMinimum: ConDir corrupted");
811	//if (H1c_grad != P->Grad.GradientArray[H1cGradient]) Error(SomeError,"FindPerturbedMinimum: H1c_grad corrupted");
812	ddEddt0 = Calculate2ndPerturbedDerivative(P, LevS->LPsi->LocalPsi[p], source, ConDir, Lat->Psi.AddData[R->ActualLocalPsiNo].Lambda * Psi->LocalPsiStatus[R->ActualLocalPsiNo].PsiFactor, ConDirHConDir, ConDirConDir);
813
814	for (i=MAXOLD-1; i > 0; i--)
815	En->ddEddt0[i] = En->ddEddt0[i-1];
816	En->ddEddt0[0] = ddEddt0;
817	E0 = En->TotalEnergy[0];
818	// delta
819	//if (isnan(E0)) { fprintf(stderr,"(%i) WARNING in CalculateLineSearch(): E0_%i[%i] = NaN!\n", P->Par.me, i, 0); Error(SomeError, "NaN-Fehler!"); }
820	//if (isnan(dEdt0)) { fprintf(stderr,"(%i) WARNING in CalculateLineSearch(): dEdt0_%i[%i] = NaN!\n", P->Par.me, i, 0); Error(SomeError, "NaN-Fehler!"); }
821	//if (isnan(ddEddt0)) { fprintf(stderr,"(%i) WARNING in CalculateLineSearch(): ddEddt0_%i[%i] = NaN!\n", P->Par.me, i, 0); Error(SomeError, "NaN-Fehler!"); }
822
823	////deltaI = CalculateDeltaI(E0, dEdt0, ddEddt0,
824	//// &EI, &dEI, &ddEI, &dcosI, &dsinI);
825	////delta = deltaI; E = EI; dE = dEI; ddE = ddEI; dcos = dcosI; dsin = dsinI;
826	if (ddEddt0 > 0) {
827	delta = - dEdt0/ddEddt0;
828	E = E0 + delta * dEdt0 + deltadelta/2. ddEddt0;
829	} else {
830	delta = 0.;
831	E = E0;
832	fprintf(stderr,"(%i) Taylor approximation leads not to minimum!\n",P->Par.me);
833	}
834
835	// shift energy delta values
836	for (i=MAXOLD-1; i > 0; i--) {
837	En->delta[i] = En->delta[i-1];
838	En->ATE[i] = En->ATE[i-1];
839	}
840	// store new one
841	En->delta[0] = delta;
842	En->ATE[0] = E;
843	if (En->TotalEnergy[1] != 0.)
844	Diff = fabs(En->TotalEnergy[1] - E0)/(En->TotalEnergy[1] - E0)*fabs((E0 - En->ATE[1])/E0);
845	else
846	Diff = 0.;
847	R->Diffcount += pow(Diff,2);
848
849	// reinstate actual density (only needed for UpdateDensityCalculation) ...
850	//CalculateOneDensityR(Lat, LevS, Dens, source, Dens->DensityArray[ActualDensity], R->FactorDensityR*Psi->LocalPsiStatus[R->ActualLocalPsiNo].PsiFactor, 1);
851	// ... before changing actual local Psi
852	for (g = 0; g < LevS->MaxG; g++) { // Here all coefficients are updated for the new found wave function
853	//if (isnan(ConDir[g].re)) { fprintf(stderr,"WARNGING: CalculateLineSearch(): ConDir_%i(%i) = NaN!\n", R->ActualLocalPsiNo, g); Error(SomeError, "NaN-Fehler!"); }
854	//if (source != LevS->LPsi->LocalPsi[R->ActualLocalPsiNo] \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"FindPerturbedMinimum: source corrupted");
855	////c_re(source[g]) = c_re(source[g])dcos + c_re(ConDir[g])dsin;
856	////c_im(source[g]) = c_im(source[g])dcos + c_im(ConDir[g])dsin;
857	c_re(source[g]) = c_re(source[g]) + c_re(ConDir[g])*delta;
858	c_im(source[g]) = c_im(source[g]) + c_im(ConDir[g])*delta;
859	}
860	if (P->Call.out[StepLeaderOut]) {
861	fprintf(stderr, "(%i,%i,%i)S(%i,%i,%i):\tTE: %e\tATE: %e\t Diff: %e\t --- d: %e\tdEdt0: %e\tddEddt0: %e\n",P->Par.my_color_comm_ST,P->Par.me_comm_ST, P->Par.me_comm_ST_PsiT, R->MinStep, R->ActualLocalPsiNo, R->PsiStep, E0, E, Diff,delta, dEdt0, ddEddt0);
862	//fprintf(stderr, "(%i,%i,%i)S(%i,%i,%i):\tp0: %e p1: %e p2: %e \tATE: %e\t Diff: %e\t --- d: %e\tdEdt0: %e\tddEddt0: %e\n",P->Par.my_color_comm_ST,P->Par.me_comm_ST, P->Par.me_comm_ST_PsiT, R->MinStep, R->ActualLocalPsiNo, R->PsiStep, En->parts[0], En->parts[1], En->parts[2], E, Diff,delta, dEdt0, ddEddt0);
863	}
864	if (P->Par.me == 0) {
865	fprintf(F->MinimisationFile, "%i\t%i\t%i\t%e\t%e\t%e\t%e\t%e\n",R->MinStep, R->ActualLocalPsiNo, R->PsiStep, E0, E, delta, dEdt0, ddEddt0);
866	fflush(F->MinimisationFile);
867	}
868	}
869
870	/** Applies perturbation operator \f$\nabla_{index}\f$ to \a *source.
871	* As wave functions are stored in the reciprocal basis set, the application is straight-forward,
872	* for every G vector, the by \a index specified component is multiplied with the respective
873	* coefficient. Afterwards, 1/i is applied by flipping real and imaginary components (and an additional minus sign on the new imaginary term).
874	* \param *P Problem at hand
875	* \param *source complex coefficients of wave function \f$\varphi(G)\f$
876	* \param *dest returned complex coefficients of wave function \f$\widehat{p}_{index}\|\varphi(G)\f$
877	* \param index_g vectorial index of operator to be applied
878	*/
879	void CalculatePerturbationOperator_P(struct Problem P, const fftw_complex source, fftw_complex *dest, const int index_g)
880	{
881	struct RunStruct *R = &P->R;
882	struct LatticeLevel *LevS = R->LevS;
883	//const fftw_complex *dest_bak = dest;
884	int g = 0;
885	if (LevS->GArray[0].GSq == 0.0) {
886	//if (dest != dest_bak) Error(SomeError,"CalculatePerturbationOperator_P: dest corrupted");
887	dest[0].re = LevS->GArray[0].G[index_g]*source[0].im;
888	dest[0].im = -LevS->GArray[0].G[index_g]*source[0].re;
889	g++;
890	}
891	for (;g<LevS->MaxG;g++) {
892	//if (dest != dest_bak \|\| g<0 \|\| g>=LevS->MaxG) Error(SomeError,"CalculatePerturbationOperator_P: g out of range");
893	dest[g].re = LevS->GArray[g].G[index_g]*source[g].im;
894	dest[g].im = -LevS->GArray[g].G[index_g]*source[g].re;
895	}
896	// don't put dest[0].im = 0! Otherwise real parts of perturbed01/10 are not the same anymore!
897	}
898
899	/** Applies perturbation operator \f$\widehat{r}_{index}\f$ to \a *source.
900	* The \a *source wave function is blown up onto upper level LatticeLevel RunStruct#Lev0, fourier
901	* transformed. Afterwards, for each point on the real mesh the coefficient is multiplied times the real
902	* vector pointing within the cell to the mesh point, yet on LatticeLevel RunStruct#LevS. The new wave
903	* function is inverse fourier transformed and the resulting reciprocal coefficients stored in *dest.
904	* \param *P Problem at hand
905	* \param *source source coefficients
906	* \param *source2 second source coefficients, e.g. in the evaluation of a scalar product
907	* \param *dest destination coefficienta array, is overwrittten!
908	* \param index_r index of real vector.
909	* \param wavenr index of respective PsiTypeTag#Occupied(!) OnePsiElementAddData for the needed Wanner centre of the wave function.
910	*/
911	void CalculatePerturbationOperator_R(struct Problem P, const fftw_complex source, fftw_complex dest, const fftw_complex source2, const int index_r, const int wavenr)
912	{
913	struct Lattice *Lat = &P->Lat;
914	struct RunStruct *R = &P->R;
915	struct LatticeLevel *Lev0 = R->Lev0;
916	struct LatticeLevel *LevS = R->LevS;
917	struct Density *Dens0 = Lev0->Dens;
918	struct fft_plan_3d *plan = Lat->plan;
919	fftw_complex *TempPsi = Dens0->DensityCArray[Temp2Density];
920	fftw_real TempPsiR = (fftw_real ) TempPsi;
921	fftw_complex *workC = Dens0->DensityCArray[TempDensity];
922	fftw_complex *PsiC = Dens0->DensityCArray[ActualPsiDensity];
923	fftw_real PsiCR = (fftw_real ) PsiC;
924	fftw_complex tempdestRC = (fftw_complex )Dens0->DensityArray[TempDensity];
925	fftw_complex posfac, destsnd, *destrcv;
926	double x[NDIM], fac[NDIM], Wcentre[NDIM];
927	const int k_normal = Lat->Psi.TypeStartIndex[Occupied] + (wavenr - Lat->Psi.TypeStartIndex[R->CurrentMin]);
928	int n[NDIM], n0, g, Index, pos, iS, i0;
929	int N[NDIM], NUp[NDIM];
930	const int N0 = LevS->Plan0.plan->local_nx;
931	N[0] = LevS->Plan0.plan->N[0];
932	N[1] = LevS->Plan0.plan->N[1];
933	N[2] = LevS->Plan0.plan->N[2];
934	NUp[0] = LevS->NUp[0];
935	NUp[1] = LevS->NUp[1];
936	NUp[2] = LevS->NUp[2];
937	Wcentre[0] = Lat->Psi.AddData[k_normal].WannierCentre[0];
938	Wcentre[1] = Lat->Psi.AddData[k_normal].WannierCentre[1];
939	Wcentre[2] = Lat->Psi.AddData[k_normal].WannierCentre[2];
940	// init pointers and values
941	const int myPE = P->Par.me_comm_ST_Psi;
942	const double FFTFactor = 1./LevS->MaxN;
943	double vector;
944	//double result, Result;
945
946	// blow up source coefficients
947	LockDensityArray(Dens0,TempDensity,real); // tempdestRC
948	LockDensityArray(Dens0,Temp2Density,imag); // TempPsi
949	LockDensityArray(Dens0,ActualPsiDensity,imag); // PsiC
950	//if (tempdestRC != (fftw_complex *)Dens0->DensityArray[TempDensity]) Error(SomeError,"CalculatePerturbationOperator_R: tempdestRC corrupted");
951	SetArrayToDouble0((double )tempdestRC ,Dens0->TotalSize2);
952	//if (TempPsi != Dens0->DensityCArray[Temp2Density]) Error(SomeError,"CalculatePerturbationOperator_R: TempPsi corrupted");
953	SetArrayToDouble0((double )TempPsi ,Dens0->TotalSize2);
954	//if (PsiC != Dens0->DensityCArray[ActualPsiDensity]) Error(SomeError,"CalculatePerturbationOperator_R: PsiC corrupted");
955	SetArrayToDouble0((double )PsiC,Dens0->TotalSize2);
956	for (g=0; g<LevS->MaxG; g++) {
957	Index = LevS->GArray[g].Index;
958	posfac = &LevS->PosFactorUp[LevS->MaxNUp*g];
959	destrcv = &tempdestRC[LevS->MaxNUp*Index];
960	for (pos=0; pos < LevS->MaxNUp; pos++) {
961	//if (destrcv != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->LocalSizeC) Error(SomeError,"CalculatePerturbationOperator_R: destrcv corrupted");
962	destrcv [pos].re = (( source[g].re)posfac[pos].re-(source[g].im)posfac[pos].im);
963	destrcv [pos].im = (( source[g].re)posfac[pos].im+(source[g].im)posfac[pos].re);
964	}
965	}
966	for (g=0; g<LevS->MaxDoubleG; g++) {
967	destsnd = &tempdestRC [LevS->DoubleG[2g]LevS->MaxNUp];
968	destrcv = &tempdestRC [LevS->DoubleG[2g+1]LevS->MaxNUp];
969	for (pos=0; pos<LevS->MaxNUp; pos++) {
970	//if (destrcv != &tempdestRC [LevS->DoubleG[2g+1]LevS->MaxNUp] \|\| LevS->DoubleG[2g]LevS->MaxNUp+pos<0 \|\| LevS->DoubleG[2g]LevS->MaxNUp+pos>=Dens0->LocalSizeC\|\| LevS->DoubleG[2g+1]LevS->MaxNUp+pos<0 \|\| LevS->DoubleG[2g+1]LevS->MaxNUp+pos>=Dens0->LocalSizeC) Error(SomeError,"CalculatePerturbationOperator_R: destrcv corrupted");
971	destrcv [pos].re = destsnd [pos].re;
972	destrcv [pos].im = -destsnd [pos].im;
973	}
974	}
975	// fourier transform blown up wave function
976	//if (tempdestRC != (fftw_complex *)Dens0->DensityArray[TempDensity]) Error(SomeError,"CalculatePerturbationOperator_R: tempdestRC corrupted");
977	//if (workC != Dens0->DensityCArray[TempDensity]) Error(SomeError,"CalculatePerturbationOperator_R: workC corrupted");
978	fft_3d_complex_to_real(plan,LevS->LevelNo, FFTNFUp, tempdestRC , workC);
979	//if (tempdestRC != (fftw_complex *)Dens0->DensityArray[TempDensity]) Error(SomeError,"CalculatePerturbationOperator_R: tempdestRC corrupted");
980	//if (TempPsiR != (fftw_real *)Dens0->DensityCArray[Temp2Density]) Error(SomeError,"CalculatePerturbationOperator_R: TempPsiR corrupted");
981	DensityRTransformPos(LevS,(fftw_real*)tempdestRC ,TempPsiR );
982	UnLockDensityArray(Dens0,TempDensity,real); // TempdestRC
983
984	//result = 0.;
985	// for every point on the real grid multiply with component of position vector
986	for (n0=0; n0<N0; n0++)
987	for (n[1]=0; n[1]<N[1]; n[1]++)
988	for (n[2]=0; n[2]<N[2]; n[2]++) {
989	n[0] = n0 + N0 * myPE;
990	fac[0] = (double)(n[0])/(double)((N[0]));
991	fac[1] = (double)(n[1])/(double)((N[1]));
992	fac[2] = (double)(n[2])/(double)((N[2]));
993	RMat33Vec3(x,Lat->RealBasis,fac);
994	iS = n[2] + N[2](n[1] + N[1]n0); // mind splitting of x axis due to multiple processes
995	i0 = n[2]NUp[2]+N[2]NUp[2](n[1]NUp[1]+N[1]NUp[1]n0*NUp[0]);
996	//PsiCR[iS] = ((double)n[0]/(double)N[0]Lat->RealBasis[0] - fabs(Wcentre[0]))TempPsiR[i0] - ((double)n[1]/(double)N[1]Lat->RealBasis[4] - fabs(Wcentre[1]))TempPsi2R[i0];
997	//fprintf(stderr,"(%i) R[%i] = (%lg,%lg,%lg)\n",P->Par.me, i0, x[0], x[1], x[2]);
998	//else fprintf(stderr,"(%i) WCentre[%i] = %e \n",P->Par.me, index_r, Wcentre[index_r]);
999	vector = sawtooth(Lat,MinImageConv(Lat,x[index_r],Wcentre[index_r],index_r),index_r);
1000	//vector = 1.;//sin((double)(n[index_r])/(double)((N[index_r]))2PI);
1001	PsiCR[iS] = vector * TempPsiR[i0];
1002	//fprintf(stderr,"(%i) vector(%i/%i,%i/%i,%i/%i): %lg\tx[%i] = %e\tWcentre[%i] = %e\tTempPsiR[%i] = %e\tPsiCR[%i] = %e\n",P->Par.me, n[0], N[0], n[1], N[1], n[2], N[2], vector, index_r, x[index_r],index_r, Wcentre[index_r],i0,TempPsiR[i0],iS,PsiCR[iS]);
1003
1004	//truedist(Lat,x[cross(index_r,2)],Wcentre[cross(index_r,2)],cross(index_r,2)) * TempPsiR[i0];
1005	//tmp += truedist(Lat,x[index_r],WCentre[index_r],index_r) * RealPhiR[i0];
1006	//tmp += sawtooth(Lat,truedist(Lat,x[index_r],WCentre[index_r],index_r), index_r)*RealPhiR[i0];
1007	//(Fehler mit falschem Ort ist vor dieser Stelle!): ueber result = RealPhiR[i0] * (x[index_r]) * RealPhiR[i0]; gecheckt
1008	//result += TempPsiR[i0] * PsiCR[iS];
1009	}
1010	UnLockDensityArray(Dens0,Temp2Density,imag); // TempPsi
1011	//MPI_Allreduce( &result, &Result, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
1012	//if (P->Par.me == 0) fprintf(stderr,"(%i) PerturbationOpertator_R: %e\n",P->Par.me, Result/LevS->MaxN);
1013	// inverse fourier transform
1014	fft_3d_real_to_complex(plan,LevS->LevelNo, FFTNF1, PsiC, workC);
1015	//fft_3d_real_to_complex(plan,LevS->LevelNo, FFTNF1, Psi2C, workC);
1016
1017	// copy to destination array
1018	for (g=0; g<LevS->MaxG; g++) {
1019	Index = LevS->GArray[g].Index;
1020	dest[g].re = ( PsiC[Index].re)*FFTFactor;
1021	dest[g].im = ( PsiC[Index].im)*FFTFactor;
1022	}
1023	UnLockDensityArray(Dens0,ActualPsiDensity,imag); //PsiC
1024	//if (LevS->GArray[0].GSq == 0)
1025	// dest[0].im = 0; // imaginary of G=0 is zero
1026	}
1027	/*
1028	{
1029	struct RunStruct *R = &P->R;
1030	struct LatticeLevel *Lev0 = R->Lev0;
1031	struct LatticeLevel *LevS = R->LevS;
1032	struct Lattice *Lat = &P->Lat;
1033	struct fft_plan_3d *plan = Lat->plan;
1034	struct Density *Dens0 = Lev0->Dens;
1035	fftw_complex *tempdestRC = Dens0->DensityCArray[TempDensity];
1036	fftw_real tempdestR = (fftw_real ) tempdestRC;
1037	fftw_complex *work = Dens0->DensityCArray[Temp2Density];
1038	fftw_complex PsiC = (fftw_complex ) Dens0->DensityCArray[ActualPsiDensity];;
1039	fftw_real PsiCR = (fftw_real ) PsiC;
1040	fftw_real RealPhiR = (fftw_real ) Dens0->DensityArray[Temp2Density];
1041	fftw_complex posfac, destsnd, *destrcv;
1042	double x[NDIM], fac[NDIM], WCentre[NDIM];
1043	int n[NDIM], N0, n0, g, Index, pos, iS, i0;
1044
1045	// init pointers and values
1046	int myPE = P->Par.me_comm_ST_Psi;
1047	double FFTFactor = 1./LevS->MaxN;
1048	int N[NDIM], NUp[NDIM];
1049	N[0] = LevS->Plan0.plan->N[0];
1050	N[1] = LevS->Plan0.plan->N[1];
1051	N[2] = LevS->Plan0.plan->N[2];
1052	NUp[0] = LevS->NUp[0];
1053	NUp[1] = LevS->NUp[1];
1054	NUp[2] = LevS->NUp[2];
1055	N0 = LevS->Plan0.plan->local_nx;
1056	wavenr = Lat->Psi.TypeStartIndex[Occupied] + (wavenr - Lat->Psi.TypeStartIndex[R->CurrentMin]);
1057	Wcentre[0] = Lat->Psi.AddData[wavenr].WannierCentre[0];
1058	Wcentre[1] = Lat->Psi.AddData[wavenr].WannierCentre[1];
1059	Wcentre[2] = Lat->Psi.AddData[wavenr].WannierCentre[2];
1060
1061	// blow up source coefficients
1062	SetArrayToDouble0((double )tempdestRC,Dens0->TotalSize2);
1063	SetArrayToDouble0((double )RealPhiR,Dens0->TotalSize2);
1064	SetArrayToDouble0((double )PsiC,Dens0->TotalSize2);
1065	for (g=0; g<LevS->MaxG; g++) {
1066	Index = LevS->GArray[g].Index;
1067	posfac = &LevS->PosFactorUp[LevS->MaxNUp*g];
1068	destrcv = &tempdestRC[LevS->MaxNUp*Index];
1069	for (pos=0; pos<LevS->MaxNUp; pos++) {
1070	destrcv[pos].re = (( source[g].re)posfac[pos].re-( source[g].im)posfac[pos].im);
1071	destrcv[pos].im = (( source[g].re)posfac[pos].im+( source[g].im)posfac[pos].re);
1072	}
1073	}
1074	for (g=0; g<LevS->MaxDoubleG; g++) {
1075	destsnd = &tempdestRC[LevS->DoubleG[2g]LevS->MaxNUp];
1076	destrcv = &tempdestRC[LevS->DoubleG[2g+1]LevS->MaxNUp];
1077	for (pos=0; pos<LevS->MaxNUp; pos++) {
1078	destrcv[pos].re = destsnd[pos].re;
1079	destrcv[pos].im = -destsnd[pos].im;
1080	}
1081	}
1082
1083	// fourier transform blown up wave function
1084	fft_3d_complex_to_real(plan,LevS->LevelNo, FFTNFUp, tempdestRC, work);
1085	DensityRTransformPos(LevS,tempdestR,RealPhiR);
1086
1087	//fft_Psi(P,source,RealPhiR,0,0);
1088
1089	// for every point on the real grid multiply with component of position vector
1090	for (n0=0; n0<N0; n0++)
1091	for (n[1]=0; n[1]<N[1]; n[1]++)
1092	for (n[2]=0; n[2]<N[2]; n[2]++) {
1093	n[0] = n0 + N0 * myPE;
1094	fac[0] = (double)(n[0])/(double)((N[0]));
1095	fac[1] = (double)(n[1])/(double)((N[1]));
1096	fac[2] = (double)(n[2])/(double)((N[2]));
1097	RMat33Vec3(x,Lat->RealBasis,fac);
1098	iS = n[2] + N[2](n[1] + N[1]n0); // mind splitting of x axis due to multiple processes
1099	i0 = n[2]NUp[2]+N[2]NUp[2](n[1]NUp[1]+N[1]NUp[1]n0*NUp[0]);
1100	//PsiCR[iS] = (x[index_r]) * RealPhiR[i0]; //- WCentre[index_r]
1101	PsiCR[iS] = truedist(Lat,x[index_r],WCentre[index_r],index_r) * RealPhiR[i0];
1102	//PsiCR[iS] = truedist(Lat,x[index_r],0.,index_r) * RealPhiR[i0];
1103	//PsiCR[iS] = sawtooth(Lat,truedist(Lat,x[index_r],WCentre[index_r],index_r), index_r)*RealPhiR[i0];
1104	//(Fehler mit falschem Ort ist vor dieser Stelle!): ueber result = RealPhiR[i0] * (x[index_r]) * RealPhiR[i0]; gecheckt
1105	}
1106
1107	// inverse fourier transform
1108	fft_3d_real_to_complex(plan,LevS->LevelNo, FFTNF1, PsiC, work);
1109
1110	// copy to destination array
1111	for (g=0; g<LevS->MaxG; g++) {
1112	Index = LevS->GArray[g].Index;
1113	dest[g].re = ( PsiC[Index].re)*FFTFactor;
1114	dest[g].im = ( PsiC[Index].im)*FFTFactor;
1115	if (LevS->GArray[g].GSq == 0)
1116	dest[g].im = 0; // imaginary of G=0 is zero
1117	}
1118	}*/
1119
1120	/** Prints the positions of all unperturbed orbitals to screen.
1121	* \param *P Problem at hand
1122	* \param type PsiTypeTag specifying group of orbitals
1123	* \sa CalculatePerturbationOperator_R()
1124	*/
1125	void OutputOrbitalPositions(struct Problem *P, const enum PsiTypeTag type)
1126	{
1127	struct Lattice *Lat = &P->Lat;
1128	struct Psis *Psi = &Lat->Psi;
1129	struct RunStruct *R = &P->R;
1130	struct LatticeLevel *LevS = R->LevS;
1131	fftw_complex *temp = LevS->LPsi->TempPsi;
1132	fftw_complex *source;
1133	int wavenr, index;
1134	double result[NDIM], Result[NDIM];
1135	//double imsult[NDIM], Imsult[NDIM];
1136	double norm[NDIM], Norm[NDIM];
1137	//double imnorm[NDIM], imNorm[NDIM];
1138	double Wcentre[NDIM];
1139
1140	// for every unperturbed wave function
1141	for (wavenr=Psi->TypeStartIndex[type]; wavenr<Psi->TypeStartIndex[type+1]; wavenr++) {
1142	source = LevS->LPsi->LocalPsi[wavenr];
1143	Wcentre[0] = Psi->AddData[wavenr].WannierCentre[0];
1144	Wcentre[1] = Psi->AddData[wavenr].WannierCentre[1];
1145	Wcentre[2] = Psi->AddData[wavenr].WannierCentre[2];
1146	for (index=0; index<NDIM; index++) {
1147	SetArrayToDouble0((double )temp,2R->InitLevS->MaxG);
1148	// apply position operator
1149	CalculatePerturbationOperator_R(P,source,temp,source,index, wavenr + Psi->TypeStartIndex[R->CurrentMin]);
1150	// take scalar product
1151	result[index] = GradSP(P,LevS,source,temp);
1152	//imsult[index] = GradImSP(P,LevS,source,temp);
1153	norm[index] = GradSP(P,LevS,source,source);
1154	//imnorm[index] = GradImSP(P,LevS,source,source);
1155	MPI_Allreduce( result, Result, NDIM, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
1156	//MPI_Allreduce( imsult, Imsult, NDIM, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
1157	MPI_Allreduce( norm, Norm, NDIM, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
1158	//MPI_Allreduce( imnorm, imNorm, NDIM, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
1159	}
1160	// print output to stderr
1161	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Position of Orbital %i: (%e,%e,%e)\n",P->Par.me, wavenr, Result[0]/Norm[0]+Wcentre[0], Result[1]/Norm[1]+Wcentre[1], Result[2]/Norm[2]+Wcentre[2]);
1162	//fprintf(stderr,"(%i) Position of Orbital %i wrt Wannier: (%e,%e,%e)\n",P->Par.me, wavenr, Result[0]/Norm[0], Result[1]/Norm[1], Result[2]/Norm[2]);
1163	//fprintf(stderr,"(%i) with Norm: (%e,%e,%e) + i (%e,%e,%e)\n",P->Par.me, Norm[0], Norm[1], Norm[2], imNorm[0], imNorm[1], imNorm[2]);
1164	//if (P->Par.me == 0) fprintf(stderr,"(%i) Position of Orbital %i: (%e,%e,%e)\n",P->Par.me, wavenr, Result[0]/Norm[0], Result[1]/Norm[1], Result[2]/Norm[2]);
1165	}
1166	}
1167
1168	#define borderstart 0.9
1169
1170	/** Applies perturbation operator \f$(\widehat{r} \times \nabla)_{index}\f$ to \a *source.
1171	* The source is fourier-transformed by transforming it to a density (on the next higher level RunStruct#Lev0)
1172	* and at the same time multiply it with the respective component of the reciprocal G vector - the momentum. This
1173	* is done by callinf fft_Psi(). Thus we get \f$\nabla_k \| \varphi (R) \rangle\f$.
1174	*
1175	* Next, we apply the two of three components of the position operator r, which ones stated by cross(), while going
1176	* in a loop through every point of the grid. In order to do this sensibly, truedist() is used to map the coordinates
1177	* onto -L/2...L/2, by subtracting the OneElementPsiAddData#WannierCentre R and wrapping. Also, due to the breaking up
1178	* of the x axis into equally sized chunks for each coefficient sharing process, we need to step only over local
1179	* x-axis grid points, however shift them to the global position when being used as position. In the end, we get
1180	* \f$\epsilon_{index,j,k} (\widehat{r}-R)_j \nabla_k \| \varphi (R) \rangle\f$.
1181	*
1182	* One last fft brings the wave function back to reciprocal basis and it is copied to \a *dest.
1183	* \param *P Problem at hand
1184	* \param *source complex coefficients of wave function \f$\varphi(G)\f$
1185	* \param *dest returned complex coefficients of wave function \f$(\widehat{r} \times \widehat{p})_{index}\|\varphi(G)\rangle\f$
1186	* \param phi0nr number within LocalPsi of the unperturbed pendant of the given perturbed wavefunction \a *source.
1187	* \param index_rxp index desired of the vector product
1188	* \sa CalculateConDirHConDir() - the procedure of fft and inverse fft is very similar.
1189	*/
1190	void CalculatePerturbationOperator_RxP(struct Problem P, const fftw_complex source, fftw_complex *dest, const int phi0nr, const int index_rxp)
1191
1192	{
1193	struct Lattice *Lat = &P->Lat;
1194	struct RunStruct *R = &P->R;
1195	struct LatticeLevel *Lev0 = R->Lev0;
1196	struct LatticeLevel *LevS = R->LevS;
1197	struct Density *Dens0 = Lev0->Dens;
1198	struct fft_plan_3d *plan = Lat->plan;
1199	fftw_complex *TempPsi = Dens0->DensityCArray[Temp2Density];
1200	fftw_real TempPsiR = (fftw_real ) TempPsi;
1201	fftw_complex TempPsi2 = (fftw_complex )Dens0->DensityArray[Temp2Density];
1202	fftw_real TempPsi2R = (fftw_real ) TempPsi2;
1203	fftw_complex *workC = Dens0->DensityCArray[TempDensity];
1204	fftw_complex *PsiC = Dens0->DensityCArray[ActualPsiDensity];
1205	fftw_real PsiCR = (fftw_real ) PsiC;
1206	double x[NDIM], fac[NDIM], Wcentre[NDIM];
1207	int n[NDIM], n0, g, Index, iS, i0; //pos,
1208	int N[NDIM], NUp[NDIM];
1209	const int N0 = LevS->Plan0.plan->local_nx;
1210	N[0] = LevS->Plan0.plan->N[0];
1211	N[1] = LevS->Plan0.plan->N[1];
1212	N[2] = LevS->Plan0.plan->N[2];
1213	NUp[0] = LevS->NUp[0];
1214	NUp[1] = LevS->NUp[1];
1215	NUp[2] = LevS->NUp[2];
1216	Wcentre[0] = Lat->Psi.AddData[phi0nr].WannierCentre[0];
1217	Wcentre[1] = Lat->Psi.AddData[phi0nr].WannierCentre[1];
1218	Wcentre[2] = Lat->Psi.AddData[phi0nr].WannierCentre[2];
1219	// init pointers and values
1220	const int myPE = P->Par.me_comm_ST_Psi;
1221	const double FFTFactor = 1./LevS->MaxN; //
1222	// double max[NDIM], max_psi[NDIM];
1223	// double max_n[NDIM];
1224	int index[4];
1225	// double smooth, wall[NDIM];
1226	// for (g=0;g<NDIM;g++) {
1227	// max[g] = 0.;
1228	// max_psi[g] = 0.;
1229	// max_n[g] = -1.;
1230	// }
1231
1232	//fprintf(stderr,"(%i) Wannier[%i] (%2.13e, %2.13e, %2.13e)\n", P->Par.me, phi0nr, 10.-Wcentre[0], 10.-Wcentre[1], 10.-Wcentre[2]);
1233	for (g=0;g<4;g++)
1234	index[g] = cross(index_rxp,g);
1235
1236	// blow up source coefficients
1237	LockDensityArray(Dens0,Temp2Density,imag); // TempPsi
1238	LockDensityArray(Dens0,Temp2Density,real); // TempPsi2
1239	LockDensityArray(Dens0,ActualPsiDensity,imag); // PsiC
1240
1241	fft_Psi(P,source,TempPsiR ,index[1],7);
1242	fft_Psi(P,source,TempPsi2R,index[3],7);
1243
1244	//result = 0.;
1245	// for every point on the real grid multiply with component of position vector
1246	for (n0=0; n0<N0; n0++)
1247	for (n[1]=0; n[1]<N[1]; n[1]++)
1248	for (n[2]=0; n[2]<N[2]; n[2]++) {
1249	n[0] = n0 + N0 * myPE;
1250	fac[0] = (double)(n[0])/(double)((N[0]));
1251	fac[1] = (double)(n[1])/(double)((N[1]));
1252	fac[2] = (double)(n[2])/(double)((N[2]));
1253	RMat33Vec3(x,Lat->RealBasis,fac);
1254	// fac[0] = (fac[0] > .9) ? fac[0]-0.9 : 0.;
1255	// fac[1] = (fac[1] > .9) ? fac[1]-0.9 : 0.;
1256	// fac[2] = (fac[2] > .9) ? fac[2]-0.9 : 0.;
1257	// RMat33Vec3(wall,Lat->RealBasis,fac);
1258	// smooth = exp(wall[0]wall[0]+wall[1]wall[1]+wall[2]*wall[2]); // smoothing near the borders of the virtual cell
1259	iS = n[2] + N[2](n[1] + N[1]n0); // mind splitting of x axis due to multiple processes
1260	i0 = n[2]NUp[2]+N[2]NUp[2](n[1]NUp[1]+N[1]NUp[1]n0*NUp[0]);
1261
1262	// if (fabs(truedist(Lat,x[index[1]],Wcentre[index[1]],index[1])) >= borderstart * sqrt(Lat->RealBasisSQ[index[1]])/2.)
1263	// if (max[index[1]] < sawtooth(Lat,truedist(Lat,x[index[1]],Wcentre[index[1]],index[1]),index[1]) * TempPsiR [i0]) {
1264	// max[index[1]] = sawtooth(Lat,truedist(Lat,x[index[1]],Wcentre[index[1]],index[1]),index[1]) * TempPsiR [i0];
1265	// max_psi[index[1]] = TempPsiR [i0];
1266	// max_n[index[1]] = truedist(Lat,x[index[1]],Wcentre[index[1]],index[1]);
1267	// }
1268	//
1269	// if (fabs(truedist(Lat,x[index[3]],Wcentre[index[3]],index[3])) >= borderstart * sqrt(Lat->RealBasisSQ[index[3]])/2.)
1270	// if (max[index[3]] < sawtooth(Lat,truedist(Lat,x[index[3]],Wcentre[index[3]],index[3]),index[3]) * TempPsiR [i0]) {
1271	// max[index[3]] = sawtooth(Lat,truedist(Lat,x[index[3]],Wcentre[index[3]],index[3]),index[3]) * TempPsiR [i0];
1272	// max_psi[index[3]] = TempPsiR [i0];
1273	// max_n[index[3]] = truedist(Lat,x[index[3]],Wcentre[index[3]],index[3]);
1274	// }
1275
1276	PsiCR[iS] = //vector * TempPsiR[i0];
1277	sawtooth(Lat,MinImageConv(Lat,x[index[0]],Wcentre[index[0]],index[0]),index[0]) * TempPsiR [i0]
1278	-sawtooth(Lat,MinImageConv(Lat,x[index[2]],Wcentre[index[2]],index[2]),index[2]) * TempPsi2R[i0];
1279	// ShiftGaugeOrigin(P,truedist(Lat,x[index[0]],Wcentre[index[0]],index[0]),index[0]) * TempPsiR [i0]
1280	// -ShiftGaugeOrigin(P,truedist(Lat,x[index[2]],Wcentre[index[2]],index[2]),index[2]) * TempPsi2R[i0];
1281	// PsiCR[iS] = (x[index[0]] - Wcentre[index[0]]) * TempPsiR [i0] - (x[index[2]] - Wcentre[index[2]]) * TempPsi2R[i0];
1282	}
1283	//if (P->Par.me == 0) fprintf(stderr,"(%i) PerturbationOpertator_R(xP): %e\n",P->Par.me, Result/LevS->MaxN);
1284	UnLockDensityArray(Dens0,Temp2Density,imag); // TempPsi
1285	UnLockDensityArray(Dens0,Temp2Density,real); // TempPsi2
1286
1287	// // print maximum values
1288	// fprintf (stderr,"(%i) RxP: Maximum values = (",P->Par.me);
1289	// for (g=0;g<NDIM;g++)
1290	// fprintf(stderr,"%lg\t", max[g]);
1291	// fprintf(stderr,"\b)\t(");
1292	// for (g=0;g<NDIM;g++)
1293	// fprintf(stderr,"%lg\t", max_psi[g]);
1294	// fprintf(stderr,"\b)\t");
1295	// fprintf (stderr,"at (");
1296	// for (g=0;g<NDIM;g++)
1297	// fprintf(stderr,"%lg\t", max_n[g]);
1298	// fprintf(stderr,"\b)\n");
1299
1300	// inverse fourier transform
1301	//if (PsiC != Dens0->DensityCArray[ActualPsiDensity]) Error(SomeError,"CalculatePerturbationOperator_RxP: PsiC corrupted");
1302	fft_3d_real_to_complex(plan,LevS->LevelNo, FFTNF1, PsiC, workC);
1303
1304	// copy to destination array
1305	SetArrayToDouble0((double )dest, 2R->InitLevS->MaxG);
1306	for (g=0; g<LevS->MaxG; g++) {
1307	Index = LevS->GArray[g].Index;
1308	dest[g].re += ( PsiC[Index].re)*FFTFactor; // factor confirmed, see grad.c:CalculateConDirHConDir()
1309	dest[g].im += ( PsiC[Index].im)*FFTFactor;
1310	//fprintf(stderr,"(%i) PsiC[(%lg,%lg,%lg)] = %lg +i %lg\n", P->Par.me, LevS->GArray[g].G[0], LevS->GArray[g].G[1], LevS->GArray[g].G[2], dest[g].re, dest[g].im);
1311	}
1312	UnLockDensityArray(Dens0,ActualPsiDensity,imag); // PsiC
1313	//if (LevS->GArray[0].GSq == 0.)
1314	//dest[0].im = 0.; // don't do this, see ..._P()
1315	}
1316
1317	/** Applies perturbation operator \f$-(\nabla \times \widehat{r})_{index}\f$ to \a *source.
1318	* Is analogous to CalculatePerturbationOperator_RxP(), only the order is reversed, first position operator, then
1319	* momentum operator
1320	* \param *P Problem at hand
1321	* \param *source complex coefficients of wave function \f$\varphi(G)\f$
1322	* \param *dest returned complex coefficients of wave function \f$(\widehat{r} \times \widehat{p})_{index}\|\varphi(G)\rangle\f$
1323	* \param phi0nr number within LocalPsi of the unperturbed pendant of the given perturbed wavefunction \a *source.
1324	* \param index_pxr index of position operator
1325	* \note Only third component is important due to initial rotiation of cell such that B field is aligned with z axis.
1326	* \sa CalculateConDirHConDir() - the procedure of fft and inverse fft is very similar.
1327	* \bug routine is not tested (but should work), as it offers no advantage over CalculatePerturbationOperator_RxP()
1328	*/
1329	void CalculatePerturbationOperator_PxR(struct Problem P, const fftw_complex source, fftw_complex *dest, const int phi0nr, const int index_pxr)
1330
1331	{
1332	struct Lattice *Lat = &P->Lat;
1333	struct RunStruct *R = &P->R;
1334	struct LatticeLevel *Lev0 = R->Lev0;
1335	struct LatticeLevel *LevS = R->LevS;
1336	struct Density *Dens0 = Lev0->Dens;
1337	struct fft_plan_3d *plan = Lat->plan;
1338	fftw_complex *TempPsi = Dens0->DensityCArray[Temp2Density];
1339	fftw_real TempPsiR = (fftw_real ) TempPsi;
1340	fftw_complex *workC = Dens0->DensityCArray[TempDensity];
1341	fftw_complex *PsiC = Dens0->DensityCArray[ActualPsiDensity];
1342	fftw_real PsiCR = (fftw_real ) PsiC;
1343	fftw_complex *Psi2C = Dens0->DensityCArray[ActualDensity];
1344	fftw_real Psi2CR = (fftw_real ) Psi2C;
1345	fftw_complex tempdestRC = (fftw_complex )Dens0->DensityArray[Temp2Density];
1346	fftw_complex posfac, destsnd, *destrcv;
1347	double x[NDIM], fac[NDIM], Wcentre[NDIM];
1348	int n[NDIM], n0, g, Index, pos, iS, i0;
1349	int N[NDIM], NUp[NDIM];
1350	const int N0 = LevS->Plan0.plan->local_nx;
1351	N[0] = LevS->Plan0.plan->N[0];
1352	N[1] = LevS->Plan0.plan->N[1];
1353	N[2] = LevS->Plan0.plan->N[2];
1354	NUp[0] = LevS->NUp[0];
1355	NUp[1] = LevS->NUp[1];
1356	NUp[2] = LevS->NUp[2];
1357	Wcentre[0] = Lat->Psi.AddData[phi0nr].WannierCentre[0];
1358	Wcentre[1] = Lat->Psi.AddData[phi0nr].WannierCentre[1];
1359	Wcentre[2] = Lat->Psi.AddData[phi0nr].WannierCentre[2];
1360	// init pointers and values
1361	const int myPE = P->Par.me_comm_ST_Psi;
1362	const double FFTFactor = 1./LevS->MaxN;
1363
1364	// blow up source coefficients
1365	SetArrayToDouble0((double )tempdestRC ,Dens0->TotalSize2);
1366	SetArrayToDouble0((double )TempPsi ,Dens0->TotalSize2);
1367	SetArrayToDouble0((double )PsiC,Dens0->TotalSize2);
1368	SetArrayToDouble0((double )Psi2C,Dens0->TotalSize2);
1369	for (g=0; g<LevS->MaxG; g++) {
1370	Index = LevS->GArray[g].Index;
1371	posfac = &LevS->PosFactorUp[LevS->MaxNUp*g];
1372	destrcv = &tempdestRC[LevS->MaxNUp*Index];
1373	for (pos=0; pos < LevS->MaxNUp; pos++) {
1374	destrcv [pos].re = (( source[g].re)posfac[pos].re-( source[g].im)posfac[pos].im);
1375	destrcv [pos].im = (( source[g].re)posfac[pos].im+( source[g].im)posfac[pos].re);
1376	}
1377	}
1378	for (g=0; g<LevS->MaxDoubleG; g++) {
1379	destsnd = &tempdestRC [LevS->DoubleG[2g]LevS->MaxNUp];
1380	destrcv = &tempdestRC [LevS->DoubleG[2g+1]LevS->MaxNUp];
1381	for (pos=0; pos<LevS->MaxNUp; pos++) {
1382	destrcv [pos].re = destsnd [pos].re;
1383	destrcv [pos].im = -destsnd [pos].im;
1384	}
1385	}
1386	// fourier transform blown up wave function
1387	fft_3d_complex_to_real(plan,LevS->LevelNo, FFTNFUp, tempdestRC , workC);
1388	DensityRTransformPos(LevS,(fftw_real*)tempdestRC ,TempPsiR );
1389
1390	//fft_Psi(P,source,TempPsiR ,cross(index_pxr,1),7);
1391	//fft_Psi(P,source,TempPsi2R,cross(index_pxr,3),7);
1392
1393	//result = 0.;
1394	// for every point on the real grid multiply with component of position vector
1395	for (n0=0; n0<N0; n0++)
1396	for (n[1]=0; n[1]<N[1]; n[1]++)
1397	for (n[2]=0; n[2]<N[2]; n[2]++) {
1398	n[0] = n0 + N0 * myPE;
1399	fac[0] = (double)(n[0])/(double)((N[0]));
1400	fac[1] = (double)(n[1])/(double)((N[1]));
1401	fac[2] = (double)(n[2])/(double)((N[2]));
1402	RMat33Vec3(x,Lat->RealBasis,fac);
1403	iS = n[2] + N[2](n[1] + N[1]n0); // mind splitting of x axis due to multiple processes
1404	i0 = n[2]NUp[2]+N[2]NUp[2](n[1]NUp[1]+N[1]NUp[1]n0*NUp[0]);
1405	// PsiCR[iS] = sawtooth(Lat,truedist(Lat,x[cross(index_pxr,1)],Wcentre[cross(index_pxr,1)],cross(index_pxr,1)),cross(index_pxr,1)) * TempPsiR[i0];
1406	// Psi2CR[iS] = sawtooth(Lat,truedist(Lat,x[cross(index_pxr,3)],Wcentre[cross(index_pxr,3)],cross(index_pxr,3)),cross(index_pxr,3)) * TempPsiR[i0];
1407	PsiCR[iS] = ShiftGaugeOrigin(P,MinImageConv(Lat,x[cross(index_pxr,1)],Wcentre[cross(index_pxr,1)],cross(index_pxr,1)),cross(index_pxr,1)) * TempPsiR[i0];
1408	Psi2CR[iS] = ShiftGaugeOrigin(P,MinImageConv(Lat,x[cross(index_pxr,3)],Wcentre[cross(index_pxr,3)],cross(index_pxr,3)),cross(index_pxr,3)) * TempPsiR[i0];
1409	}
1410
1411	// inverse fourier transform
1412	fft_3d_real_to_complex(plan,LevS->LevelNo, FFTNF1, PsiC, workC);
1413	fft_3d_real_to_complex(plan,LevS->LevelNo, FFTNF1, Psi2C, workC);
1414
1415	// copy to destination array
1416	for (g=0; g<LevS->MaxG; g++) {
1417	Index = LevS->GArray[g].Index;
1418	dest[g].re = -LevS->GArray[g].G[cross(index_pxr,0)]( PsiC[Index].im)FFTFactor;
1419	dest[g].im = -LevS->GArray[g].G[cross(index_pxr,0)](-PsiC[Index].re)FFTFactor;
1420	dest[g].re -= -LevS->GArray[g].G[cross(index_pxr,2)]( Psi2C[Index].im)FFTFactor;
1421	dest[g].im -= -LevS->GArray[g].G[cross(index_pxr,2)](-Psi2C[Index].re)FFTFactor;
1422	}
1423	if (LevS->GArray[0].GSq == 0.)
1424	dest[0].im = 0.; // don't do this, see ..._P()
1425	}
1426
1427	/** Evaluates first derivative of perturbed energy functional with respect to minimisation parameter \f$\Theta\f$.
1428	* \f[
1429	* \frac{\delta {\cal E}^{(2)}} {\delta \Theta} =
1430	* 2 {\cal R} \langle \widetilde{\varphi}_i^{(1)} \| {\cal H}^{(0)} \| \varphi_i^{(1)} \rangle
1431	* - \sum_l \lambda_{il} \langle \widetilde{\varphi}_i^{(1)} \| \varphi_l^{(1)} \rangle
1432	* - \sum_k \lambda_{ki} \langle \varphi_k^{(1)} \| \widetilde{\varphi}_i^{(1)} \rangle
1433	* + 2 {\cal R} \langle \widetilde{\varphi}_i^{(1)} \| {\cal H}^{(1)} \| \varphi_i^{(0)} \rangle
1434	* \f]
1435	*
1436	* The summation over all Psis has again to be done with an MPI exchange of non-local coefficients, as the conjugate
1437	* directions are not the same in situations where PePGamma > 1 (Psis split up among processes = multiple minimisation)
1438	* \param *P Problem at hand
1439	* \param source0 unperturbed wave function \f$\varphi_l^{(0)}\f$
1440	* \param source perturbed wave function \f$\varphi_l^{(1)} (G)\f$
1441	* \param ConDir normalized conjugate direction \f$\widetilde{\varphi}_l^{(1)} (G)\f$
1442	* \param Hc_grad complex coefficients of \f$H^{(0)} \| \varphi_l^{(1)} (G) \rangle\f$, see GradientArray#HcGradient
1443	* \param H1c_grad complex coefficients of \f$H^{(1)} \| \varphi_l^{(0)} (G) \rangle\f$, see GradientArray#H1cGradient
1444	* \sa CalculateLineSearch() - used there, \sa CalculateConDirHConDir() - same principles
1445	* \warning The MPI_Allreduce for the scalar product in the end has not been done and must not have been done for given
1446	* parameters yet!
1447	*/
1448	double Calculate1stPerturbedDerivative(struct Problem P, const fftw_complex source0, const fftw_complex source, const fftw_complex ConDir, const fftw_complex Hc_grad, const fftw_complex H1c_grad)
1449	{
1450	struct RunStruct *R = &P->R;
1451	struct Psis *Psi = &P->Lat.Psi;
1452	struct LatticeLevel *LevS = R->LevS;
1453	double result = 0., E0 = 0., Elambda = 0., E1 = 0.;//, E2 = 0.;
1454	int i,m,j;
1455	const int state = R->CurrentMin;
1456	//const int l_normal = R->ActualLocalPsiNo - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[Occupied];
1457	const int ActNum = R->ActualLocalPsiNo - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[1] * Psi->LocalPsiStatus[R->ActualLocalPsiNo].my_color_comm_ST_Psi;
1458	//int l = R->ActualLocalPsiNo;
1459	//int l_normal = Psi->TypeStartIndex[Occupied] + (l - Psi->TypeStartIndex[state]); // offset l to \varphi_l^{(0)}
1460	struct OnePsiElement OnePsiB, LOnePsiB;
1461	//fftw_complex *HConGrad = LevS->LPsi->TempPsi;
1462	fftw_complex *LPsiDatB=NULL;
1463	const int ElementSize = (sizeof(fftw_complex) / sizeof(double));
1464	int RecvSource;
1465	MPI_Status status;
1466
1467	//CalculateCDfnl(P,ConDir,PP->CDfnl);
1468	//ApplyTotalHamiltonian(P,ConDir,HConDir, PP->CDfnl, 1, 0);
1469	//E0 = (GradSP(P, LevS, ConDir, Hc_grad) + GradSP(P, LevS, source, HConDir)) * Psi->LocalPsiStatus[R->ActualLocalPsiNo].PsiFactor;
1470	E0 = 2.GradSP(P, LevS, ConDir, Hc_grad) Psi->LocalPsiStatus[R->ActualLocalPsiNo].PsiFactor;
1471	result = E0;
1472	//fprintf(stderr,"(%i) 1st: E0 = \t\t%lg\n", P->Par.me, E0);
1473
1474	m = -1;
1475	for (j=0; j < Psi->MaxPsiOfType+P->Par.Max_me_comm_ST_PsiT; j++) { // go through all wave functions
1476	OnePsiB = &Psi->AllPsiStatus[j]; // grab OnePsiB
1477	if (OnePsiB->PsiType == state) { // drop all but the ones of current min state
1478	m++; // increase m if it is type-specific wave function
1479	if (OnePsiB->my_color_comm_ST_Psi == P->Par.my_color_comm_ST_Psi) // local?
1480	LOnePsiB = &Psi->LocalPsiStatus[OnePsiB->MyLocalNo];
1481	else
1482	LOnePsiB = NULL;
1483	if (LOnePsiB == NULL) { // if it's not local ... receive it from respective process into TempPsi
1484	RecvSource = OnePsiB->my_color_comm_ST_Psi;
1485	MPI_Recv( LevS->LPsi->TempPsi, LevS->MaxG*ElementSize, MPI_DOUBLE, RecvSource, PerturbedTag, P->Par.comm_ST_PsiT, &status );
1486	LPsiDatB=LevS->LPsi->TempPsi;
1487	} else { // .. otherwise send it to all other processes (Max_me... - 1)
1488	for (i=0;i<P->Par.Max_me_comm_ST_PsiT;i++)
1489	if (i != OnePsiB->my_color_comm_ST_Psi)
1490	MPI_Send( LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo], LevS->MaxG*ElementSize, MPI_DOUBLE, i, PerturbedTag, P->Par.comm_ST_PsiT);
1491	LPsiDatB=LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo];
1492	} // LPsiDatB is now set to the coefficients of OnePsi either stored or MPI_Received
1493
1494	Elambda -= 2.Psi->lambda[ActNum][m]GradSP(P, LevS, ConDir, LPsiDatB) * OnePsiB->PsiFactor; // lambda is symmetric
1495	}
1496	}
1497	result += Elambda;
1498	//fprintf(stderr,"(%i) 1st: Elambda = \t%lg\n", P->Par.me, Elambda);
1499
1500	E1 = 2.GradSP(P,LevS,ConDir,H1c_grad) sqrt(Psi->AllPsiStatus[ActNum].PsiFactor*Psi->LocalPsiStatus[R->ActualLocalPsiNo].PsiFactor);
1501	result += E1;
1502	//fprintf(stderr,"(%i) 1st: E1 = \t\t%lg\n", P->Par.me, E1);
1503
1504	return result;
1505	}
1506
1507
1508	/** Evaluates second derivative of perturbed energy functional with respect to minimisation parameter \f$\Theta\f$.
1509	* \f[
1510	* \frac{\delta^2 {\cal E}^{(2)}} {\delta \Theta^2} =
1511	* 2 \bigl( \langle \widetilde{\varphi}_l^{(1)} \| {\cal H}^{(0)} \| \widetilde{\varphi}_l^{(1)} \rangle
1512	* - \langle \varphi_l^{(1)} \| {\cal H}^{(0)} \| \varphi_l^{(1)} \rangle \bigr )
1513	* + 2 \sum_{i,i \neq l } \lambda_{il} \langle \varphi_i^{(1)} \| \varphi_l^{(1)} \rangle
1514	* - 2 {\cal R} \langle \varphi_l^{(1)} \| {\cal H}^{(1)} \| \varphi_l^{(0)} \rangle
1515	* \f]
1516	*
1517	* The energy eigenvalues of \a ConDir and \a source must be supplied, they can be calculated via CalculateConDirHConDir() and/or
1518	* by the due to CalculatePerturbedEnergy() already present OnePsiElementAddData#Lambda eigenvalue. The summation over the
1519	* unperturbed lambda within the scalar product of perturbed wave functions is evaluated with Psis#lambda and Psis#Overlap.
1520	* Afterwards, the ConDir density is calculated and also the i-th perturbed density to first degree. With these in a sum over
1521	* all real mesh points the exchange-correlation first and second derivatives and also the Hartree potential ones can be calculated
1522	* and summed up.
1523	* \param *P Problem at hand
1524	* \param source0 unperturbed wave function \f$\varphi_l^{(0)}\f$
1525	* \param source wave function \f$\varphi_l^{(1)}\f$
1526	* \param ConDir conjugated direction \f$\widetilde{\varphi}_l^{(1)}\f$
1527	* \param sourceHsource eigenvalue of wave function \f$\langle \varphi_l^{(1)} \| H^{(0)} \| \varphi_l^{(1)}\rangle\f$
1528	* \param ConDirHConDir perturbed eigenvalue of conjugate direction \f$\langle \widetilde{\varphi}_l^{(1)} \| H^{(0)} \| \widetilde{\varphi}_l^{(1)}\rangle\f$
1529	* \param ConDirConDir norm of conjugate direction \f$\langle \widetilde{\varphi}_l^{(1)} \| \widetilde{\varphi}_l^{(1)}\rangle\f$
1530	* \warning No MPI_AllReduce() takes place, parameters have to be reduced already.
1531	*/
1532	double Calculate2ndPerturbedDerivative(struct Problem P, const fftw_complex source0,const fftw_complex source, const fftw_complex ConDir,const double sourceHsource, const double ConDirHConDir, const double ConDirConDir)
1533	{
1534	struct RunStruct *R = &P->R;
1535	struct Psis *Psi = &P->Lat.Psi;
1536	//struct Lattice *Lat = &P->Lat;
1537	//struct Energy *E = Lat->E;
1538	double result = 0.;
1539	double Con0 = 0., Elambda = 0.;//, E0 = 0., E1 = 0.;
1540	//int i;
1541	const int state = R->CurrentMin;
1542	//const int l_normal = R->ActualLocalPsiNo - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[Occupied];
1543	const int ActNum = R->ActualLocalPsiNo - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[1] * Psi->LocalPsiStatus[R->ActualLocalPsiNo].my_color_comm_ST_Psi;
1544
1545	Con0 = 2.*ConDirHConDir;
1546	result += Con0;
1547	////E0 = -2.*sourceHsource;
1548	////result += E0;
1549	////E1 = -E->PsiEnergy[Perturbed1_0Energy][R->ActualLocalPsiNo] - E->PsiEnergy[Perturbed0_1Energy][R->ActualLocalPsiNo];
1550	////result += E1;
1551	//fprintf(stderr,"(%i) 2nd: E1 = \t%lg\n", P->Par.me, E1);
1552
1553	////for (i=0;i<Lat->Psi.NoOfPsis;i++) {
1554	//// if (i != ActNum) Elambda += Psi->lambda[i][ActNum]Psi->Overlap[i][ActNum]+ Psi->lambda[ActNum][i]Psi->Overlap[ActNum][i]; // overlap contains PsiFactor
1555	////}
1556	////Elambda = Psi->lambda[ActNum][ActNum]*Psi->Overlap[ActNum][ActNum];
1557	Elambda = 2.Psi->lambda[ActNum][ActNum]ConDirConDir;
1558	result -= Elambda;
1559
1560	//fprintf(stderr,"(%i) 2ndPerturbedDerivative: Result = Con0 + E0 + E1 + Elambda + dEdt0_XC + ddEddt0_XC + dEdt0_H + ddEddt0_H = %lg + %lg + %lg + %lg + %lg + %lg + %lg + %lg = %lg\n", P->Par.me, Con0, E0, E1, Elambda, VolumeFactorRdEdt0_XC, VolumeFactorRddEddt0_XC, dEdt0_H, ddEddt0_H, result);
1561
1562	return (result);
1563	}
1564
1565	/** Returns index of specific component in 3x3 cross product.
1566	* \param i vector product component index, ranging from 0..NDIM
1567	* \param j index specifies which one of the four vectors in xy - yx, ranging from 0..3 (0,1 positive sign, 2,3 negative sign)
1568	* \return Component 0..2 of vector to be taken to evaluate a vector product
1569	* \sa crossed() - is the same but vice versa, return value must be specified, \a i is returned.
1570	*/
1571	inline int cross(int i, int j)
1572	{
1573	const int matrix[NDIM*4] = {1,2,2,1,2,0,0,2,0,1,1,0};
1574	if (i>=0 && i<NDIM && j>=0 && j<4)
1575	return (matrix[i*4+j]);
1576	else {
1577	Error(SomeError,"cross: i or j out of range!");
1578	return (0);
1579	}
1580	}
1581
1582	/** Returns index of resulting vector component in 3x3 cross product.
1583	* In the column specified by the \a j index \a i is looked for and the found row index returned.
1584	* \param i vector component index, ranging from 0..NDIM
1585	* \param j index specifies which one of the four vectors in xy - yx, ranging from 0..3 (0,1 positive sign, 2,3 negative sign)
1586	* \return Component 0..2 of resulting vector
1587	* \sa cross() - is the same but vice versa, return value must be specified, \a i is returned.
1588	*/
1589	inline int crossed(int i, int j)
1590	{
1591	const int matrix[NDIM*4] = {1,2,2,1,2,0,0,2,0,1,1,0};
1592	int k;
1593	if (i>=0 && i<NDIM && j>=0 && j<4) {
1594	for (k=0;k<NDIM;k++)
1595	if (matrix[4*k+j] == i) return(k);
1596	Error(SomeError,"crossed: given component not found!");
1597	return(-1);
1598	} else {
1599	Error(SomeError,"crossed: i or j out of range!");
1600	return (-1);
1601	}
1602	}
1603
1604	#define Nsin 16 //!< should be dependent on MaxG/MaxN per axis!
1605
1606	/** Returns sawtooth shaped profile for position operator within cell.
1607	* This is a mapping from -L/2...L/2 (L = length of unit cell derived from Lattice#RealBasisSQ) to -L/2 to L/2 with a smooth transition:
1608	* \f[
1609	* f(x): x \rightarrow \left \{
1610	* \begin{array}{l}
1611	* -\frac{L}{2} \cdot \sin \left ( \frac{x}{0,05\cdot L} \cdot \frac{\pi}{2} \right ), 0<x<0,05\cdot L \\
1612	* (x - 0,05\cdot L) \cdot \frac{10}{9} - \frac{L}{2}, 0,05\cdot L \leq x<0,95\cdot L \\
1613	* \frac{L}{2} \cdot \cos \left ( \frac{x-0,95\cdot L}{0,05\cdot L} \cdot \frac{\pi}{2} \right), 0,95\cdot L<x<L
1614	* \end{array} \right \}
1615	* \f]
1616	* \param *Lat pointer to Lattice structure for Lattice#RealBasisSQ
1617	* \param L parameter x
1618	* \param index component index for Lattice#RealBasisSQ
1619	*/
1620	inline double sawtooth(struct Lattice *Lat, double L, const int index)
1621	{
1622	double axis = sqrt(Lat->RealBasisSQ[index]);
1623	double sawstart = Lat->SawtoothStart;
1624	double sawend = 1. - sawstart;
1625	double sawfactor = (sawstart+sawend)/(sawend-sawstart);
1626	//return(L);
1627
1628	//fprintf(stderr, "sawstart: %e\tsawend: %e\tsawfactor: %e\tL: %e\n", sawstart, sawend, sawfactor, L);
1629	// transform and return (sawtooth profile checked, 04.08.06)
1630	L += axis/2.; // transform to 0 ... L
1631	if (L < (sawstartaxis)) return (-axis/(2sawfactor)sin(L/(sawstartaxis)*PI/2.)); // first smooth transition from 0 ... -L/2
1632	if (L > (sawendaxis)) return ( axis/(2sawfactor)cos((L-sawendaxis)/(sawstartaxis)PI/2.)); // second smooth transition from +L/2 ... 0
1633	//fprintf(stderr,"L %e\t sawstart %e\t sawend %e\t sawfactor %e\t axis%e\n", L, sawstart, sawend, sawfactor, axis);
1634	//return ((L - sawstartaxis) - axis/(2sawfactor)); // area in between scale to -L/2 ... +L/2
1635	return (L - axis/2); // area in between return as it was
1636	}
1637
1638	/** Shifts the origin of the gauge according to the CSDGT method.
1639	* \f[
1640	* d(r) = r - \sum_{I_s,I_a} (r-R_{I_s,I_a}) exp{(-\alpha_{I_s,I_a}(r-R_{I_s,I_a})^4)}
1641	* \f]
1642	* This trafo is necessary as the current otherweise (CSGT) sensitively depends on the current around
1643	* the core region inadequately/only moderately well approximated by a plane-wave-pseudo-potential-method.
1644	* \param *P Problem at hand, containing Lattice and Ions
1645	* \param r parameter r
1646	* \param index index of the basis vector
1647	* \return \f$d(r)\f$
1648	* \note Continuous Set of Damped Gauge Transformations according to Keith and Bader
1649	*/
1650	inline double ShiftGaugeOrigin(struct Problem *P, double r, const int index)
1651	{
1652	struct Ions *I = &P->Ion;
1653	struct Lattice *Lat = &P->Lat;
1654	double x, tmp;
1655	int is,ia;
1656
1657	// loop over all ions to calculate the sum
1658	x = r;
1659	for (is=0; is < I->Max_Types; is++)
1660	for (ia=0; ia < I->I[is].Max_IonsOfType; ia++) {
1661	tmp = (r - I->I[is].R[NDIM*ia]);
1662	x -= tmpexp(- I->I[is].alpha[ia] tpow(tmp,4));
1663	}
1664
1665	return(sawtooth(Lat,x,index)); // still use sawtooth due to the numerical instability around the border region of the cell
1666	}
1667
1668	/** Print sawtooth() for each node along one axis.
1669	* \param *P Problem at hand, containing RunStruct, Lattice and LatticeLevel RunStruct#LevS
1670	* \param index index of axis
1671	*/
1672	void TestSawtooth(struct Problem *P, const int index)
1673	{
1674	struct RunStruct *R = &P->R;
1675	struct LatticeLevel *LevS = R->LevS;
1676	struct Lattice *Lat =&P->Lat;
1677	double x;
1678	int n;
1679	int N[NDIM];
1680	N[0] = LevS->Plan0.plan->N[0];
1681	N[1] = LevS->Plan0.plan->N[1];
1682	N[2] = LevS->Plan0.plan->N[2];
1683
1684	for (n=0;n<N[index];n++) {
1685	x = (double)n/(double)N[index] * sqrt(Lat->RealBasisSQ[index]);
1686	//fprintf(stderr,"(%i) x %e\t Axis/2 %e\n",P->Par.me, x, sqrt(Lat->RealBasisSQ[index])/2. );
1687	x = MinImageConv(Lat, x, sqrt(Lat->RealBasisSQ[index])/2., index);
1688	fprintf(stderr,"%e\t%e\n", x, sawtooth(Lat,x,index));
1689	}
1690	}
1691
1692	/** Secures minimum image convention between two given points \a R[] and \a r[] within periodic boundary.
1693	* Each distance component within a periodic boundary must always be between -L/2 ... L/2
1694	* \param *Lat pointer to Lattice structure
1695	* \param R[] first vector, NDIM, each must be between 0...L
1696	* \param r[] second vector, NDIM, each must be between 0...L
1697	* \param index of component
1698	* \return component between -L/2 ... L/2
1699	*/
1700	inline double MinImageConv(struct Lattice *Lat, const double R, const double r, const int index)
1701	{
1702	double axis = sqrt(Lat->RealBasisSQ[index]);
1703	double result = 0.;
1704
1705	if (fabs(result = R - r + axis) < axis/2.) { }
1706	else if (fabs(result = R - r) <= axis/2.) { }
1707	else if (fabs(result = R - r - axis) < axis/2.) { }
1708	else Error(SomeError, "MinImageConv: None of the three cases applied!");
1709	return (result);
1710	}
1711
1712
1713	/** Fouriertransforms given \a source.
1714	* By the use of the symmetry parameter an additional imaginary unit and/or the momentum operator can
1715	* be applied at the same time.
1716	* \param *P Problem at hand
1717	* \param *Psi source array of reciprocal coefficients
1718	* \param *PsiR destination array, becoming filled with real coefficients
1719	* \param index_g component of G vector (only needed for symmetry=4..7)
1720	* \param symmetry 0 - do nothing, 1 - factor by "-1", 2 - factor by "i", 3 - factor by "1/i = -i", from 4 to 7 the same
1721	* but additionally with momentum operator
1722	*/
1723	void fft_Psi(struct Problem P, const fftw_complex Psi, fftw_real *PsiR, const int index_g, const int symmetry)
1724	{
1725	struct Lattice *Lat = &P->Lat;
1726	struct RunStruct *R = &P->R;
1727	struct LatticeLevel *Lev0 = R->Lev0;
1728	struct LatticeLevel *LevS = R->LevS;
1729	struct Density *Dens0 = Lev0->Dens;
1730	struct fft_plan_3d *plan = Lat->plan;
1731	fftw_complex tempdestRC = (fftw_complex )Dens0->DensityArray[TempDensity];
1732	fftw_complex *work = Dens0->DensityCArray[TempDensity];
1733	fftw_complex posfac, destpos, destRCS, destRCD;
1734	int i, Index, pos;
1735
1736	LockDensityArray(Dens0,TempDensity,imag); // tempdestRC
1737	SetArrayToDouble0((double )tempdestRC, Dens0->TotalSize2);
1738	SetArrayToDouble0((double )PsiR, Dens0->TotalSize2);
1739	switch (symmetry) {
1740	case 0:
1741	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is positive
1742	Index = LevS->GArray[i].Index;
1743	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
1744	destpos = &tempdestRC[LevS->MaxNUp*Index];
1745	for (pos=0; pos < LevS->MaxNUp; pos++) {
1746	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
1747	destpos[pos].re = (Psi[i].re)posfac[pos].re-(Psi[i].im)posfac[pos].im;
1748	destpos[pos].im = (Psi[i].re)posfac[pos].im+(Psi[i].im)posfac[pos].re;
1749	}
1750	}
1751	break;
1752	case 1:
1753	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is - positive
1754	Index = LevS->GArray[i].Index;
1755	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
1756	destpos = &tempdestRC[LevS->MaxNUp*Index];
1757	for (pos=0; pos < LevS->MaxNUp; pos++) {
1758	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
1759	destpos[pos].re = -((Psi[i].re)posfac[pos].re-(Psi[i].im)posfac[pos].im);
1760	destpos[pos].im = -((Psi[i].re)posfac[pos].im+(Psi[i].im)posfac[pos].re);
1761	}
1762	}
1763	break;
1764	case 2:
1765	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is negative
1766	Index = LevS->GArray[i].Index;
1767	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
1768	destpos = &tempdestRC[LevS->MaxNUp*Index];
1769	for (pos=0; pos < LevS->MaxNUp; pos++) {
1770	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
1771	destpos[pos].re = (-Psi[i].im)posfac[pos].re-(Psi[i].re)posfac[pos].im;
1772	destpos[pos].im = (-Psi[i].im)posfac[pos].im+(Psi[i].re)posfac[pos].re;
1773	}
1774	}
1775	break;
1776	case 3:
1777	for (i=0;i<LevS->MaxG;i++) { // incoming is negative, outgoing is positive
1778	Index = LevS->GArray[i].Index;
1779	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
1780	destpos = &tempdestRC[LevS->MaxNUp*Index];
1781	for (pos=0; pos < LevS->MaxNUp; pos++) {
1782	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
1783	destpos[pos].re = (Psi[i].im)posfac[pos].re-(-Psi[i].re)posfac[pos].im;
1784	destpos[pos].im = (Psi[i].im)posfac[pos].im+(-Psi[i].re)posfac[pos].re;
1785	}
1786	}
1787	break;
1788	case 4:
1789	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is positive
1790	Index = LevS->GArray[i].Index;
1791	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
1792	destpos = &tempdestRC[LevS->MaxNUp*Index];
1793	for (pos=0; pos < LevS->MaxNUp; pos++) {
1794	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
1795	destpos[pos].re = LevS->GArray[i].G[index_g]((Psi[i].re)posfac[pos].re-(Psi[i].im)*posfac[pos].im);
1796	destpos[pos].im = LevS->GArray[i].G[index_g]((Psi[i].re)posfac[pos].im+(Psi[i].im)*posfac[pos].re);
1797	}
1798	}
1799	break;
1800	case 5:
1801	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is - positive
1802	Index = LevS->GArray[i].Index;
1803	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
1804	destpos = &tempdestRC[LevS->MaxNUp*Index];
1805	for (pos=0; pos < LevS->MaxNUp; pos++) {
1806	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
1807	destpos[pos].re = -LevS->GArray[i].G[index_g]((Psi[i].re)posfac[pos].re-(Psi[i].im)*posfac[pos].im);
1808	destpos[pos].im = -LevS->GArray[i].G[index_g]((Psi[i].re)posfac[pos].im+(Psi[i].im)*posfac[pos].re);
1809	}
1810	}
1811	break;
1812	case 6:
1813	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is negative
1814	Index = LevS->GArray[i].Index;
1815	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
1816	destpos = &tempdestRC[LevS->MaxNUp*Index];
1817	for (pos=0; pos < LevS->MaxNUp; pos++) {
1818	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
1819	destpos[pos].re = LevS->GArray[i].G[index_g]((-Psi[i].im)posfac[pos].re-(Psi[i].re)*posfac[pos].im);
1820	destpos[pos].im = LevS->GArray[i].G[index_g]((-Psi[i].im)posfac[pos].im+(Psi[i].re)*posfac[pos].re);
1821	}
1822	}
1823	break;
1824	case 7:
1825	for (i=0;i<LevS->MaxG;i++) { // incoming is negative, outgoing is positive
1826	Index = LevS->GArray[i].Index;
1827	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
1828	destpos = &tempdestRC[LevS->MaxNUp*Index];
1829	for (pos=0; pos < LevS->MaxNUp; pos++) {
1830	//if (destpos != &tempdestRC[LevS->MaxNUpIndex] \|\| LevS->MaxNUpIndex+pos<0 \|\| LevS->MaxNUp*Index+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destpos corrupted");
1831	destpos[pos].re = LevS->GArray[i].G[index_g]((Psi[i].im)posfac[pos].re-(-Psi[i].re)*posfac[pos].im);
1832	destpos[pos].im = LevS->GArray[i].G[index_g]((Psi[i].im)posfac[pos].im+(-Psi[i].re)*posfac[pos].re);
1833	}
1834	}
1835	break;
1836	}
1837	for (i=0; i<LevS->MaxDoubleG; i++) {
1838	destRCS = &tempdestRC[LevS->DoubleG[2i]LevS->MaxNUp];
1839	destRCD = &tempdestRC[LevS->DoubleG[2i+1]LevS->MaxNUp];
1840	for (pos=0; pos < LevS->MaxNUp; pos++) {
1841	//if (destRCD != &tempdestRC[LevS->DoubleG[2i+1]LevS->MaxNUp] \|\| LevS->DoubleG[2i+1]LevS->MaxNUp+pos<0 \|\| LevS->DoubleG[2i+1]LevS->MaxNUp+pos>=Dens0->TotalSize) Error(SomeError,"fft_Psi: destRCD corrupted");
1842	destRCD[pos].re = destRCS[pos].re;
1843	destRCD[pos].im = -destRCS[pos].im;
1844	}
1845	}
1846	fft_3d_complex_to_real(plan, LevS->LevelNo, FFTNFUp, tempdestRC, work);
1847	DensityRTransformPos(LevS,(fftw_real*)tempdestRC, PsiR);
1848	UnLockDensityArray(Dens0,TempDensity,imag); // tempdestRC
1849	}
1850
1851	/** Locks all NDIM_NDIM current density arrays
1852	* \param Dens0 Density structure to be locked (in the current parts)
1853	*/
1854	void AllocCurrentDensity(struct Density *Dens0) {
1855	// real
1856	LockDensityArray(Dens0,CurrentDensity0,real); // CurrentDensity[B_index]
1857	LockDensityArray(Dens0,CurrentDensity1,real); // CurrentDensity[B_index]
1858	LockDensityArray(Dens0,CurrentDensity2,real); // CurrentDensity[B_index]
1859	LockDensityArray(Dens0,CurrentDensity3,real); // CurrentDensity[B_index]
1860	LockDensityArray(Dens0,CurrentDensity4,real); // CurrentDensity[B_index]
1861	LockDensityArray(Dens0,CurrentDensity5,real); // CurrentDensity[B_index]
1862	LockDensityArray(Dens0,CurrentDensity6,real); // CurrentDensity[B_index]
1863	LockDensityArray(Dens0,CurrentDensity7,real); // CurrentDensity[B_index]
1864	LockDensityArray(Dens0,CurrentDensity8,real); // CurrentDensity[B_index]
1865	// imaginary
1866	LockDensityArray(Dens0,CurrentDensity0,imag); // CurrentDensity[B_index]
1867	LockDensityArray(Dens0,CurrentDensity1,imag); // CurrentDensity[B_index]
1868	LockDensityArray(Dens0,CurrentDensity2,imag); // CurrentDensity[B_index]
1869	LockDensityArray(Dens0,CurrentDensity3,imag); // CurrentDensity[B_index]
1870	LockDensityArray(Dens0,CurrentDensity4,imag); // CurrentDensity[B_index]
1871	LockDensityArray(Dens0,CurrentDensity5,imag); // CurrentDensity[B_index]
1872	LockDensityArray(Dens0,CurrentDensity6,imag); // CurrentDensity[B_index]
1873	LockDensityArray(Dens0,CurrentDensity7,imag); // CurrentDensity[B_index]
1874	LockDensityArray(Dens0,CurrentDensity8,imag); // CurrentDensity[B_index]
1875	}
1876
1877	/** Reset and unlocks all NDIM_NDIM current density arrays
1878	* \param Dens0 Density structure to be unlocked/resetted (in the current parts)
1879	*/
1880	void DisAllocCurrentDensity(struct Density *Dens0) {
1881	//int i;
1882	// real
1883	// for(i=0;i<NDIM*NDIM;i++)
1884	// SetArrayToDouble0((double )Dens0->DensityArray[i], Dens0->TotalSize2);
1885	UnLockDensityArray(Dens0,CurrentDensity0,real); // CurrentDensity[B_index]
1886	UnLockDensityArray(Dens0,CurrentDensity1,real); // CurrentDensity[B_index]
1887	UnLockDensityArray(Dens0,CurrentDensity2,real); // CurrentDensity[B_index]
1888	UnLockDensityArray(Dens0,CurrentDensity3,real); // CurrentDensity[B_index]
1889	UnLockDensityArray(Dens0,CurrentDensity4,real); // CurrentDensity[B_index]
1890	UnLockDensityArray(Dens0,CurrentDensity5,real); // CurrentDensity[B_index]
1891	UnLockDensityArray(Dens0,CurrentDensity6,real); // CurrentDensity[B_index]
1892	UnLockDensityArray(Dens0,CurrentDensity7,real); // CurrentDensity[B_index]
1893	UnLockDensityArray(Dens0,CurrentDensity8,real); // CurrentDensity[B_index]
1894	// imaginary
1895	// for(i=0;i<NDIM*NDIM;i++)
1896	// SetArrayToDouble0((double )Dens0->DensityCArray[i], Dens0->TotalSize2);
1897	UnLockDensityArray(Dens0,CurrentDensity0,imag); // CurrentDensity[B_index]
1898	UnLockDensityArray(Dens0,CurrentDensity1,imag); // CurrentDensity[B_index]
1899	UnLockDensityArray(Dens0,CurrentDensity2,imag); // CurrentDensity[B_index]
1900	UnLockDensityArray(Dens0,CurrentDensity3,imag); // CurrentDensity[B_index]
1901	UnLockDensityArray(Dens0,CurrentDensity4,imag); // CurrentDensity[B_index]
1902	UnLockDensityArray(Dens0,CurrentDensity5,imag); // CurrentDensity[B_index]
1903	UnLockDensityArray(Dens0,CurrentDensity6,imag); // CurrentDensity[B_index]
1904	UnLockDensityArray(Dens0,CurrentDensity7,imag); // CurrentDensity[B_index]
1905	UnLockDensityArray(Dens0,CurrentDensity8,imag); // CurrentDensity[B_index]
1906	}
1907
1908	// these defines safe-guard same symmetry for same kind of wave function
1909	#define Psi0symmetry 0 // //0 //0 //0 // regard psi0 as real
1910	#define Psi1symmetry 0 // //3 //0 //0 // regard psi0 as real
1911	#define Psip0symmetry 6 //6 //6 //6 //6 // momentum times "i" due to operation on left hand
1912	#define Psip1symmetry 7 //7 //4 //6 //7 // momentum times "-i" as usual (right hand)
1913
1914	/** Evaluates the 3x3 current density arrays.
1915	* The formula we want to evaluate is as follows
1916	* \f[
1917	* j_k(r) = \langle \psi_k^{(0)} \| \Bigl ( p\|r'\rangle\langle r' \| + \| r' \rangle \langle r' \| p \Bigr )
1918	\Bigl [ \| \psi_k^{(r\times p )} \rangle - r' \times \| \psi_k^{(p)} \rangle \Bigr ] \cdot B.
1919	* \f]
1920	* Most of the DensityTypes-arrays are locked for temporary use. Pointers are set to their
1921	* start address and afterwards the current density arrays locked and reset'ed. Then for every
1922	* unperturbed wave function we do:
1923	* -# FFT unperturbed p-perturbed and rxp-perturbed wave function
1924	* -# FFT wave function with applied momentum operator for all three indices
1925	* -# For each index of the momentum operator:
1926	* -# FFT p-perturbed wave function
1927	* -# For every index of the external field:
1928	* -# FFT rxp-perturbed wave function
1929	* -# Evaluate current density for these momentum index and external field indices
1930	*
1931	* Afterwards the temporary densities are unlocked and the density ones gathered from all Psi-
1932	* sharing processes.
1933	*
1934	* \param *P Problem at hand, containing Lattice and RunStruct
1935	*/
1936	void FillCurrentDensity(struct Problem *P)
1937	{
1938	struct Lattice *Lat = &P->Lat;
1939	struct RunStruct *R = &P->R;
1940	struct Psis *Psi = &Lat->Psi;
1941	struct LatticeLevel *LevS = R->LevS;
1942	struct LatticeLevel *Lev0 = R->Lev0;
1943	struct Density *Dens0 = Lev0->Dens;
1944	fftw_complex *Psi0;
1945	fftw_real Psi0R, Psip0R;
1946	fftw_real CurrentDensity[NDIMNDIM];
1947	fftw_real *Psi1R;
1948	fftw_real *Psip1R;
1949	fftw_real *tempArray; // intendedly the same
1950	double r_bar[NDIM], x[NDIM], fac[NDIM];
1951	double Current;//, current;
1952	const double UnitsFactor = 1.; ///LevS->MaxN; // 1/N (from ff-backtransform)
1953	int i, index, B_index;
1954	int k, j, i0;
1955	int n[NDIM], n0;
1956	int N[NDIM];
1957	N[0] = Lev0->Plan0.plan->N[0];
1958	N[1] = Lev0->Plan0.plan->N[1];
1959	N[2] = Lev0->Plan0.plan->N[2];
1960	const int N0 = Lev0->Plan0.plan->local_nx;
1961	//int ActNum;
1962	const int myPE = P->Par.me_comm_ST_Psi;
1963	const int type = R->CurrentMin;
1964	MPI_Status status;
1965	int cross_lookup_1[4], cross_lookup_3[4], l_1 = 0, l_3 = 0;
1966
1967	//fprintf(stderr,"(%i) FactoR %e\n", P->Par.me, R->FactorDensityR);
1968
1969	// Init values and pointers
1970	if (P->Call.out[PsiOut]) {
1971	fprintf(stderr,"(%i) LockArray: ", P->Par.me);
1972	for(i=0;i<MaxDensityTypes;i++)
1973	fprintf(stderr,"(%i,%i) ",Dens0->LockArray[i],Dens0->LockCArray[i]);
1974	fprintf(stderr,"\n");
1975	}
1976	LockDensityArray(Dens0,Temp2Density,real); // Psi1R
1977	LockDensityArray(Dens0,Temp2Density,imag); // Psip1R and tempArray
1978	LockDensityArray(Dens0,GapDensity,real); // Psi0R
1979	LockDensityArray(Dens0,GapLocalDensity,real); // Psip0R
1980
1981	Psi0R = (fftw_real *)Dens0->DensityArray[GapDensity];
1982	Psip0R = (fftw_real *)Dens0->DensityArray[GapLocalDensity];
1983	Psi1R = (fftw_real *)Dens0->DensityArray[Temp2Density];
1984	tempArray = Psip1R = (fftw_real *)Dens0->DensityCArray[Temp2Density];
1985	SetArrayToDouble0((double )Psi0R,Dens0->TotalSize2);
1986	SetArrayToDouble0((double )Psip0R,Dens0->TotalSize2);
1987	SetArrayToDouble0((double )Psi1R,Dens0->TotalSize2);
1988	SetArrayToDouble0((double )Psip1R,Dens0->TotalSize2);
1989
1990	if (P->Call.out[PsiOut]) {
1991	fprintf(stderr,"(%i) LockArray: ", P->Par.me);
1992	for(i=0;i<MaxDensityTypes;i++)
1993	fprintf(stderr,"(%i,%i) ",Dens0->LockArray[i],Dens0->LockCArray[i]);
1994	fprintf(stderr,"\n");
1995	}
1996
1997	// don't put the following stuff into a for loop, they might not be continuous! (preprocessor values: CurrentDensity...)
1998	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
1999	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
2000	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
2001	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
2002	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
2003	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
2004	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
2005	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
2006	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
2007
2008	// initialize the array if it is the first of all six perturbation run
2009	if ((R->DoFullCurrent == 0) && (R->CurrentMin == Perturbed_P0)) { // reset if FillDelta...() hasn't done it before
2010	debug(P,"resetting CurrentDensity...");
2011	for (B_index=0; B_index<NDIM*NDIM; B_index++) // initialize current density array
2012	SetArrayToDouble0((double )CurrentDensity[B_index],Dens0->TotalSize2); // DensityArray is fftw_real, no 2*LocalSizeR here!
2013	}
2014
2015	switch(type) { // set j (which is linked to the index from derivation wrt to B^{ext})
2016	case Perturbed_P0:
2017	case Perturbed_P1:
2018	case Perturbed_P2:
2019	j = type - Perturbed_P0;
2020	l_1 = crossed(j,1);
2021	l_3 = crossed(j,3);
2022	for(k=0;k<4;k++) {
2023	cross_lookup_1[k] = cross(l_1,k);
2024	cross_lookup_3[k] = cross(l_3,k);
2025	}
2026	break;
2027	case Perturbed_RxP0:
2028	case Perturbed_RxP1:
2029	case Perturbed_RxP2:
2030	j = type - Perturbed_RxP0;
2031	break;
2032	default:
2033	j = 0;
2034	Error(SomeError,"FillCurrentDensity() called while not in perturbed minimisation!");
2035	break;
2036	}
2037
2038	int wished = -1;
2039	FILE *file = fopen(P->Call.MainParameterFile,"r");
2040	if (!ParseForParameter(1,file,"Orbital",0,1,1,int_type,&wished, 1, optional)) {
2041	fprintf(stderr,"Desired Orbital missing!\n");
2042	wished = -1;
2043	} else if (wished != -1) {
2044	fprintf(stderr,"Desired Orbital is: %i.\n", wished);
2045	} else {
2046	fprintf(stderr,"Desired Orbital is: All.\n");
2047	}
2048	fclose(file);
2049
2050	// Commence grid filling
2051	for (k=Psi->TypeStartIndex[Occupied];k<Psi->TypeStartIndex[Occupied+1];k++) // every local wave functions adds up its part of the current
2052	if ((k + P->Par.me_comm_ST_PsiT*(Psi->TypeStartIndex[UnOccupied]-Psi->TypeStartIndex[Occupied]) == wished) \|\| (wished == -1)) { // compare with global number
2053	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i)Calculating Current Density Summand of type %s for Psi (%i/%i) ... \n", P->Par.me, R->MinimisationName[type], Psi->LocalPsiStatus[k].MyGlobalNo, k);
2054	//ActNum = k - Psi->TypeStartIndex[Occupied] + Psi->TypeStartIndex[1] * Psi->LocalPsiStatus[k].my_color_comm_ST_Psi; // global number of unperturbed Psi
2055	Psi0 = LevS->LPsi->LocalPsi[k]; // Local unperturbed psi
2056
2057	// now some preemptive ffts for the whole grid
2058	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Bringing \|Psi0> one level up and fftransforming\n", P->Par.me);
2059	fft_Psi(P, Psi0, Psi0R, 0, Psi0symmetry); //0 // 0 //0
2060
2061	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Bringing \|Psi1> one level up and fftransforming\n", P->Par.me);
2062	fft_Psi(P, LevS->LPsi->LocalPsi[Psi->TypeStartIndex[type]+k], Psi1R, 0, Psi1symmetry); //3 //0 //0
2063
2064	for (index=0;index<NDIM;index++) { // for all NDIM components of momentum operator
2065
2066	if ((P->Call.out[StepLeaderOut]) && (!index)) fprintf(stderr,"(%i) Bringing p\|Psi0> one level up and fftransforming\n", P->Par.me);
2067	fft_Psi(P, Psi0, Psip0R, index, Psip0symmetry); //6 //6 //6
2068
2069	if ((P->Call.out[StepLeaderOut]) && (!index)) fprintf(stderr,"(%i) Bringing p\|Psi1> one level up and fftransforming\n", P->Par.me);
2070	fft_Psi(P, LevS->LPsi->LocalPsi[Psi->TypeStartIndex[type]+k], Psip1R, index, Psip1symmetry); //4 //6 //7
2071
2072	// then for every point on the grid in real space ...
2073
2074	//if (Psi1R != (fftw_real *)Dens0->DensityArray[Temp2Density] \|\| i0<0 \|\| i0>=Dens0->LocalSizeR) Error(SomeError,"fft_Psi: Psi1R corrupted");
2075	//Psi1R[i0] = (Psi1_rxp_R[j])[i0] - (r_bar[cross(j,0)] * (Psi1_p_R[cross(j,1)])[i0] - r_bar[cross(j,2)] * (Psi1_p_R[cross(j,3)])[i0]); //
2076	//if (Psip1R != (fftw_real *)Dens0->DensityCArray[Temp2Density] \|\| i0<0 \|\| i0>=Dens0->LocalSizeR) Error(SomeError,"fft_Psi: Psip1R corrupted");
2077	//Psip1R[i0] = Psi1_rxp_pR[i0] - (r_bar[cross(j,0)] * (Psi1_p_pR[cross(j,1)])[i0] - r_bar[cross(j,2)] * (Psi1_p_pR[cross(j,3)])[i0]); //
2078
2079	switch(type) {
2080	case Perturbed_P0:
2081	case Perturbed_P1:
2082	case Perturbed_P2:
2083	for (n0=0;n0<N0;n0++) // only local points on x axis
2084	for (n[1]=0;n[1]<N[1];n[1]++)
2085	for (n[2]=0;n[2]<N[2];n[2]++) {
2086	i0 = n[2]+N[2](n[1]+N[1]n0);
2087	n[0]=n0 + N0*myPE; // global relative coordinate: due to partitoning of x-axis in PEPGamma>1 case
2088	fac[0] = (double)n[0]/(double)N[0];
2089	fac[1] = (double)n[1]/(double)N[1];
2090	fac[2] = (double)n[2]/(double)N[2];
2091	RMat33Vec3(x, Lat->RealBasis, fac); // relative coordinate times basis matrix gives absolute ones
2092	for (i=0;i<NDIM;i++) // build gauge-translated r_bar evaluation point
2093	r_bar[i] =
2094	sawtooth(Lat,MinImageConv(Lat, x[i], Psi->AddData[k].WannierCentre[i], i),i);
2095	// ShiftGaugeOrigin(P,truedist(Lat, x[i], Psi->AddData[k].WannierCentre[i], i),i);
2096	//truedist(Lat, x[i], Psi->AddData[k].WannierCentre[i], i);
2097
2098	Current = Psip0R[i0] * (r_bar[cross_lookup_1[0]] * Psi1R[i0]);
2099	Current += (Psi0R[i0] * r_bar[cross_lookup_1[0]] * Psip1R[i0]);
2100	Current = .5 UnitsFactor * Psi->LocalPsiStatus[k].PsiFactor * R->FactorDensityR; // factor confirmed, see CalculateOneDensityR() and InitDensityCalculation()
2101	////if (CurrentDensity[index+jNDIM] != (fftw_real ) Dens0->DensityArray[CurrentDensity0 + index+jNDIM] \|\| i0<0 \|\| i0>=Dens0->LocalSizeR \|\| (index+jNDIM)<0 \|\| (index+jNDIM)>=NDIMNDIM) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
2102	CurrentDensity[index+l_1*NDIM][i0] -= Current; // note: sign of cross product resides in Current itself (here: plus)
2103
2104	Current = - Psip0R[i0] * (r_bar[cross_lookup_3[2]] * Psi1R[i0]);
2105	Current += - (Psi0R[i0] * r_bar[cross_lookup_3[2]] * Psip1R[i0]);
2106	Current = .5 UnitsFactor * Psi->LocalPsiStatus[k].PsiFactor * R->FactorDensityR; // factor confirmed, see CalculateOneDensityR() and InitDensityCalculation()
2107	////if (CurrentDensity[index+jNDIM] != (fftw_real ) Dens0->DensityArray[CurrentDensity0 + index+jNDIM] \|\| i0<0 \|\| i0>=Dens0->LocalSizeR \|\| (index+jNDIM)<0 \|\| (index+jNDIM)>=NDIMNDIM) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
2108	CurrentDensity[index+l_3*NDIM][i0] -= Current; // note: sign of cross product resides in Current itself (here: minus)
2109	}
2110	break;
2111	case Perturbed_RxP0:
2112	case Perturbed_RxP1:
2113	case Perturbed_RxP2:
2114	for (n0=0;n0<N0;n0++) // only local points on x axis
2115	for (n[1]=0;n[1]<N[1];n[1]++)
2116	for (n[2]=0;n[2]<N[2];n[2]++) {
2117	i0 = n[2]+N[2](n[1]+N[1]n0);
2118	Current = (Psip0R[i0] * Psi1R[i0] + Psi0R[i0] * Psip1R[i0]);
2119	Current = .5 UnitsFactor * Psi->LocalPsiStatus[k].PsiFactor * R->FactorDensityR; // factor confirmed, see CalculateOneDensityR() and InitDensityCalculation()
2120	////if (CurrentDensity[index+jNDIM] != (fftw_real ) Dens0->DensityArray[CurrentDensity0 + index+jNDIM] \|\| i0<0 \|\| i0>=Dens0->LocalSizeR \|\| (index+jNDIM)<0 \|\| (index+jNDIM)>=NDIMNDIM) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
2121	CurrentDensity[index+j*NDIM][i0] += Current;
2122	}
2123	break;
2124	default:
2125	break;
2126	}
2127	}
2128	//OutputCurrentDensity(P);
2129	}
2130
2131	//debug(P,"Unlocking arrays");
2132	//debug(P,"GapDensity");
2133	UnLockDensityArray(Dens0,GapDensity,real); // Psi0R
2134	//debug(P,"GapLocalDensity");
2135	UnLockDensityArray(Dens0,GapLocalDensity,real); // Psip0R
2136	//debug(P,"Temp2Density");
2137	UnLockDensityArray(Dens0,Temp2Density,real); // Psi1R
2138
2139	// if (P->Call.out[StepLeaderOut])
2140	// fprintf(stderr,"\n\n");
2141
2142	//debug(P,"MPI operation");
2143	// and in the end gather partial densities from other processes
2144	if (type == Perturbed_RxP2) // exchange all (due to shared wave functions) only after last pertubation run
2145	for (index=0;index<NDIM*NDIM;index++) {
2146	//if (tempArray != (fftw_real *)Dens0->DensityCArray[Temp2Density]) Error(SomeError,"FillCurrentDensity: tempArray corrupted");
2147	//debug(P,"tempArray to zero");
2148	SetArrayToDouble0((double )tempArray, Dens0->TotalSize2);
2149	////if (CurrentDensity[index] != (fftw_real *) Dens0->DensityArray[CurrentDensity0 + index]) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
2150	//debug(P,"CurrentDensity exchange");
2151	MPI_Allreduce( CurrentDensity[index], tempArray, Dens0->LocalSizeR, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_PsiT); // gather results from all wave functions ...
2152	switch(Psi->PsiST) { // ... and also from SpinUp/Downs
2153	default:
2154	//debug(P,"CurrentDensity = tempArray");
2155	for (i=0;i<Dens0->LocalSizeR;i++) {
2156	////if (CurrentDensity[index] != (fftw_real *) Dens0->DensityArray[CurrentDensity0 + index] \|\| i<0 \|\| i>=Dens0->LocalSizeR) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
2157	CurrentDensity[index][i] = tempArray[i];
2158	}
2159	break;
2160	case SpinUp:
2161	//debug(P,"CurrentDensity exchange spinup");
2162	MPI_Sendrecv(tempArray, Dens0->LocalSizeR, MPI_DOUBLE, P->Par.me_comm_ST, CurrentTag1,
2163	CurrentDensity[index], Dens0->LocalSizeR, MPI_DOUBLE, P->Par.me_comm_ST, CurrentTag2, P->Par.comm_STInter, &status );
2164	//debug(P,"CurrentDensity += tempArray");
2165	for (i=0;i<Dens0->LocalSizeR;i++) {
2166	////if (CurrentDensity[index] != (fftw_real *) Dens0->DensityArray[CurrentDensity0 + index] \|\| i<0 \|\| i>=Dens0->LocalSizeR) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
2167	CurrentDensity[index][i] += tempArray[i];
2168	}
2169	break;
2170	case SpinDown:
2171	//debug(P,"CurrentDensity exchange spindown");
2172	MPI_Sendrecv(tempArray, Dens0->LocalSizeR, MPI_DOUBLE, P->Par.me_comm_ST, CurrentTag2,
2173	CurrentDensity[index], Dens0->LocalSizeR, MPI_DOUBLE, P->Par.me_comm_ST, CurrentTag1, P->Par.comm_STInter, &status );
2174	//debug(P,"CurrentDensity += tempArray");
2175	for (i=0;i<Dens0->LocalSizeR;i++) {
2176	////if (CurrentDensity[index] != (fftw_real *) Dens0->DensityArray[CurrentDensity0 + index] \|\| i<0 \|\| i>=Dens0->LocalSizeR) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
2177	CurrentDensity[index][i] += tempArray[i];
2178	}
2179	break;
2180	}
2181	}
2182	//debug(P,"Temp2Density");
2183	UnLockDensityArray(Dens0,Temp2Density,imag); // Psip1R and tempArray
2184	//debug(P,"CurrentDensity end");
2185	}
2186
2187	/** Structure holding Problem at hand and two indices, defining the greens function to be inverted.
2188	*/
2189	struct params
2190	{
2191	struct Problem *P;
2192	int *k;
2193	int *l;
2194	int *iter;
2195	fftw_complex *x_l;
2196	};
2197
2198	/** Wrapper function to solve G_kl x = b for x.
2199	* \param *x above x
2200	* \param *param additional parameters, here Problem at hand
2201	* \return evaluated to be minimized functional \f$\frac{1}{2}x \cdot Ax - xb\f$ at \a x on return
2202	*/
2203	static double DeltaCurrent_f(const gsl_vector * x, void * param)
2204	{
2205	struct Problem P = ((struct params )param)->P;
2206	struct RunStruct *R = &P->R;
2207	struct LatticeLevel *LevS = R->LevS;
2208	struct Psis *Psi = &P->Lat.Psi;
2209	struct PseudoPot *PP = &P->PP;
2210	const double PsiFactor = Psi->AllPsiStatus[((struct params )param)->k].PsiFactor;
2211	double result = 0.;
2212	fftw_complex *TempPsi = LevS->LPsi->TempPsi;
2213	fftw_complex *TempPsi2 = LevS->LPsi->TempPsi2;
2214	int u;
2215
2216	//fprintf(stderr,"Evaluating f(%i,%i) for %i-th time\n", ((struct params )param)->k, ((struct params )param)->l, ((struct params )param)->iter);
2217
2218	// extract gsl_vector
2219	for (u=0;u<LevS->MaxG;u++) {
2220	TempPsi[u].re = gsl_vector_get(x, 2*u);
2221	TempPsi[u].im = gsl_vector_get(x, 2*u+1);
2222	}
2223	// generate fnl
2224	CalculateCDfnl(P, TempPsi, PP->CDfnl); // calculate needed non-local form factors
2225	// Apply Hamiltonian to x
2226	ApplyTotalHamiltonian(P,TempPsi,TempPsi2, PP->CDfnl,PsiFactor,0);
2227	// take scalar product to get eigen value
2228	result = .5 * PsiFactor * (((((struct params )param)->k == ((struct params )param)->l ? GradSP(P,LevS,TempPsi,TempPsi2) : 0.) - Psi->lambda[((struct params )param)->k][((struct params )param)->l])) - GradSP(P,LevS,TempPsi,LevS->LPsi->LocalPsi[((struct params )param)->l]);
2229	return result;
2230	}
2231
2232	/** Wrapper function to solve G_kl x = b for x.
2233	* \param *x above x
2234	* \param *param additional parameters, here Problem at hand
2235	* \param *g gradient vector on return
2236	* \return error code
2237	*/
2238	static void DeltaCurrent_df(const gsl_vector * x, void * param, gsl_vector * g)
2239	{
2240	struct Problem P = ((struct params )param)->P;
2241	struct RunStruct *R = &P->R;
2242	struct LatticeLevel *LevS = R->LevS;
2243	struct Psis *Psi = &P->Lat.Psi;
2244	struct PseudoPot *PP = &P->PP;
2245	const double PsiFactor = Psi->AllPsiStatus[((struct params )param)->k].PsiFactor;
2246	fftw_complex *TempPsi = LevS->LPsi->TempPsi;
2247	fftw_complex *TempPsi2 = LevS->LPsi->TempPsi2;
2248	fftw_complex x_l = ((struct params )param)->x_l;
2249	int u;
2250
2251	//fprintf(stderr,"Evaluating df(%i,%i) for %i-th time\n", ((struct params )param)->k, ((struct params )param)->l, ((struct params )param)->iter);
2252
2253	// extract gsl_vector
2254	for (u=0;u<LevS->MaxG;u++) {
2255	TempPsi[u].re = gsl_vector_get(x, 2*u);
2256	TempPsi[u].im = gsl_vector_get(x, 2*u+1);
2257	}
2258	// generate fnl
2259	CalculateCDfnl(P, TempPsi, PP->CDfnl); // calculate needed non-local form factors
2260	// Apply Hamiltonian to x
2261	ApplyTotalHamiltonian(P,TempPsi,TempPsi2, PP->CDfnl,PsiFactor,0);
2262	// put into returning vector
2263	for (u=0;u<LevS->MaxG;u++) {
2264	gsl_vector_set(g, 2*u, TempPsi2[u].re - x_l[u].re);
2265	gsl_vector_set(g, 2*u+1, TempPsi2[u].im - x_l[u].im);
2266	}
2267	}
2268
2269	/** Wrapper function to solve G_kl x = b for x.
2270	* \param *x above x
2271	* \param *param additional parameters, here Problem at hand
2272	* \param *f evaluated to be minimized functional \f$\frac{1}{2}x \cdot Ax - xb\f$ at \a x on return
2273	* \param *g gradient vector on return
2274	* \return error code
2275	*/
2276	static void DeltaCurrent_fdf(const gsl_vector * x, void * param, double * f, gsl_vector * g)
2277	{
2278	struct Problem P = ((struct params )param)->P;
2279	struct RunStruct *R = &P->R;
2280	struct LatticeLevel *LevS = R->LevS;
2281	struct Psis *Psi = &P->Lat.Psi;
2282	struct PseudoPot *PP = &P->PP;
2283	const double PsiFactor = Psi->AllPsiStatus[((struct params )param)->k].PsiFactor;
2284	fftw_complex *TempPsi = LevS->LPsi->TempPsi;
2285	fftw_complex *TempPsi2 = LevS->LPsi->TempPsi2;
2286	fftw_complex x_l = ((struct params )param)->x_l;
2287	int u;
2288
2289	//fprintf(stderr,"Evaluating fdf(%i,%i) for %i-th time\n", ((struct params )param)->k, ((struct params )param)->l, ((struct params )param)->iter);
2290
2291	// extract gsl_vector
2292	for (u=0;u<LevS->MaxG;u++) {
2293	TempPsi[u].re = gsl_vector_get(x, 2*u);
2294	TempPsi[u].im = gsl_vector_get(x, 2*u+1);
2295	}
2296	// generate fnl
2297	CalculateCDfnl(P, TempPsi, PP->CDfnl); // calculate needed non-local form factors
2298	// Apply Hamiltonian to x
2299	ApplyTotalHamiltonian(P,TempPsi,TempPsi2, PP->CDfnl,PsiFactor,0);
2300	// put into returning vector
2301	for (u=0;u<LevS->MaxG;u++) {
2302	gsl_vector_set(g, 2*u, TempPsi[u].re - x_l[u].re);
2303	gsl_vector_set(g, 2*u+1, TempPsi[u].im - x_l[u].im);
2304	}
2305
2306	f = .5 PsiFactor * (((((struct params )param)->k == ((struct params )param)->l ? GradSP(P,LevS,TempPsi,TempPsi2) : 0.) - Psi->lambda[((struct params )param)->k][((struct params )param)->l])) - GradSP(P,LevS,TempPsi,LevS->LPsi->LocalPsi[((struct params )param)->l]);
2307	}
2308
2309	/** Evaluates the \f$\Delta j_k(r')\f$ component of the current density.
2310	* \f[
2311	* \Delta j_k(r') = \frac{e}{m} \sum_l \langle \varphi^{(0)}_k \| \left ( p \|r'\rangle \langle r'\| + \| r'\rangle\langle r'\|p \right ) {\cal G}_{kl} (d_k - d_l) \times p \| \varphi^{(1)}_l \rangle \cdot B
2312	* \f]
2313	* \param *P Problem at hand
2314	* \note result has not yet been MPI_Allreduced for ParallelSimulationData#comm_ST_inter or ParallelSimulationData#comm_ST_PsiT groups!
2315	* \warning the routine is checked but does not yet produce sensible results.
2316	*/
2317	void FillDeltaCurrentDensity(struct Problem *P)
2318	{
2319	struct Lattice *Lat = &P->Lat;
2320	struct RunStruct *R = &P->R;
2321	struct Psis *Psi = &Lat->Psi;
2322	struct LatticeLevel *Lev0 = R->Lev0;
2323	struct LatticeLevel *LevS = R->LevS;
2324	struct Density *Dens0 = Lev0->Dens;
2325	int i,j,s;
2326	int k,l,u, in, dex, index,i0;
2327	//const int Num = Psi->NoOfPsis;
2328	int RecvSource;
2329	MPI_Status status;
2330	struct OnePsiElement OnePsiB, LOnePsiB, OnePsiA, LOnePsiA;
2331	const int ElementSize = (sizeof(fftw_complex) / sizeof(double));
2332	int n[NDIM], n0;
2333	int N[NDIM];
2334	N[0] = Lev0->Plan0.plan->N[0];
2335	N[1] = Lev0->Plan0.plan->N[1];
2336	N[2] = Lev0->Plan0.plan->N[2];
2337	const int N0 = Lev0->Plan0.plan->local_nx;
2338	fftw_complex *LPsiDatB;
2339	fftw_complex Psi0, Psi1;
2340	fftw_real Psi0R, Psip0R;
2341	fftw_real Psi1R, Psip1R;
2342	fftw_complex x_l = LevS->LPsi->TempPsi;//, *x_l_bak;
2343	fftw_real CurrentDensity[NDIMNDIM];
2344	int mem_avail, MEM_avail;
2345	double Current;
2346	const double UnitsFactor = 1.;
2347	int cross_lookup[4];
2348	struct params param;
2349	double factor; // temporary factor in Psi1 pre-evaluation
2350
2351	LockDensityArray(Dens0,GapDensity,real); // Psi0R
2352	LockDensityArray(Dens0,GapLocalDensity,real); // Psip0R
2353	LockDensityArray(Dens0,Temp2Density,imag); // Psi1
2354	LockDensityArray(Dens0,GapUpDensity,real); // Psi1R
2355	LockDensityArray(Dens0,GapDownDensity,real); // Psip1R
2356
2357	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
2358	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
2359	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
2360	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
2361	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
2362	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
2363	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
2364	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
2365	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
2366
2367	Psi0R = (fftw_real *)Dens0->DensityArray[GapDensity];
2368	Psip0R = (fftw_real *)Dens0->DensityArray[GapLocalDensity];
2369	Psi1 = (fftw_complex *) Dens0->DensityCArray[Temp2Density];
2370	Psi1R = (fftw_real *)Dens0->DensityArray[GapUpDensity];
2371	Psip1R = (fftw_real *)Dens0->DensityArray[GapDownDensity];
2372
2373	// if (R->CurrentMin == Perturbed_P0)
2374	// for (B_index=0; B_index<NDIM*NDIM; B_index++) { // initialize current density array
2375	// debug(P,"resetting CurrentDensity...");
2376	// SetArrayToDouble0((double )CurrentDensity[B_index],Dens0->TotalSize2); // DensityArray is fftw_real, no 2*LocalSizeR here!
2377	// }
2378	//if (Psi1 != (fftw_complex *) Dens0->DensityCArray[Temp2Density]) Error(SomeError,"FillDeltaCurrentDensity: Psi1 corrupted");
2379	SetArrayToDouble0((double )Psi1,2Dens0->TotalSize);
2380
2381	// gsl_vector *x = gsl_vector_alloc(Num);
2382	// gsl_matrix *G = gsl_matrix_alloc(Num,Num);
2383	// gsl_permutation *p = gsl_permutation_alloc(Num);
2384	//int signum;
2385	// begin of GSL linearer CG solver stuff
2386	int iter, Status;
2387
2388	const gsl_multimin_fdfminimizer_type *T;
2389	gsl_multimin_fdfminimizer *minset;
2390
2391	/* Position of the minimum (1,2). */
2392	//double par[2] = { 1.0, 2.0 };
2393
2394	gsl_vector *x;
2395	gsl_multimin_function_fdf my_func;
2396
2397	param.P = P;
2398	param.k = &k;
2399	param.l = &l;
2400	param.iter = &iter;
2401	param.x_l = x_l;
2402
2403	my_func.f = &DeltaCurrent_f;
2404	my_func.df = &DeltaCurrent_df;
2405	my_func.fdf = &DeltaCurrent_fdf;
2406	my_func.n = 2*LevS->MaxG;
2407	my_func.params = (void *)&param;
2408
2409	T = gsl_multimin_fdfminimizer_conjugate_pr;
2410	minset = gsl_multimin_fdfminimizer_alloc (T, 2*LevS->MaxG);
2411	x = gsl_vector_alloc (2*LevS->MaxG);
2412	// end of GSL CG stuff
2413
2414
2415	// // construct G_kl = - (H^{(0)} \delta_{kl} -\langle \varphi^{(0)}_k \|H^{(0)}\| \varphi^{(0)}_l\|rangle)^{-1} = A^{-1}
2416	// for (k=0;k<Num;k++)
2417	// for (l=0;l<Num;l++)
2418	// gsl_matrix_set(G, k, l, k == l ? 0. : Psi->lambda[k][l]);
2419	// // and decompose G_kl = L U
2420
2421	mem_avail = MEM_avail = 0;
2422	// x_l_bak = x_l = (fftw_complex *) Malloc(sizeof(fftw_complex )Num,"FillDeltaCurrentDensity: x_l");
2423	// for (i=0;i<Num;i++) {
2424	// x_l[i] = NULL;
2425	// x_l[i] = (fftw_complex ) malloc(sizeof(fftw_complex)LevS->MaxG);
2426	// if (x_l[i] == NULL) {
2427	// mem_avail = 1; // there was not enough memory for this node
2428	// fprintf(stderr,"(%i) FillDeltaCurrentDensity: x_l[%i] ... insufficient memory.\n",P->Par.me,i);
2429	// }
2430	// }
2431	// MPI_Allreduce(&mem_avail,&MEM_avail,1,MPI_INT,MPI_SUM,P->Par.comm_ST); // sum results from all processes
2432
2433	if (MEM_avail != 0) { // means at least node couldn't allocate sufficient memory, skipping...
2434	fprintf(stderr,"(%i) FillDeltaCurrentDensity: x_l[], not enough memory: %i! Skipping FillDeltaCurrentDensity evaluation.", P->Par.me, MEM_avail);
2435	} else {
2436	// sum over k and calculate \Delta j_k(r')
2437	k=-1;
2438	for (i=0; i < Psi->MaxPsiOfType+P->Par.Max_me_comm_ST_PsiT; i++) { // go through all wave functions
2439	//fprintf(stderr,"(%i) GlobalNo: %d\tLocalNo: %d\n", P->Par.me,Psi->AllPsiStatus[i].MyGlobalNo,Psi->AllPsiStatus[i].MyLocalNo);
2440	OnePsiA = &Psi->AllPsiStatus[i]; // grab OnePsiA
2441	if (OnePsiA->PsiType == Occupied) { // drop the extra and perturbed ones
2442	k++;
2443	if (OnePsiA->my_color_comm_ST_Psi == P->Par.my_color_comm_ST_Psi) // local?
2444	LOnePsiA = &Psi->LocalPsiStatus[OnePsiA->MyLocalNo];
2445	else
2446	LOnePsiA = NULL;
2447	if (LOnePsiA != NULL) {
2448	Psi0=LevS->LPsi->LocalPsi[OnePsiA->MyLocalNo];
2449
2450	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Bringing \|Psi0> one level up and fftransforming\n", P->Par.me);
2451	//if (Psi0R != (fftw_real *)Dens0->DensityArray[GapDensity]) Error(SomeError,"FillDeltaCurrentDensity: Psi0R corrupted");
2452	fft_Psi(P,Psi0,Psi0R, 0, Psi0symmetry); //0 // 0 //0
2453
2454	for (in=0;in<NDIM;in++) { // in is the index from derivation wrt to B^{ext}
2455	l = -1;
2456	for (j=0; j < Psi->MaxPsiOfType+P->Par.Max_me_comm_ST_PsiT; j++) { // go through all wave functions
2457	OnePsiB = &Psi->AllPsiStatus[j]; // grab OnePsiA
2458	if (OnePsiB->PsiType == Occupied)
2459	l++;
2460	if ((OnePsiB != OnePsiA) && (OnePsiB->PsiType == Occupied)) { // drop the same and the extra ones
2461	if (OnePsiB->my_color_comm_ST_Psi == P->Par.my_color_comm_ST_Psi) // local?
2462	LOnePsiB = &Psi->LocalPsiStatus[OnePsiB->MyLocalNo];
2463	else
2464	LOnePsiB = NULL;
2465	if (LOnePsiB == NULL) { // if it's not local ... receive x from respective process
2466	RecvSource = OnePsiB->my_color_comm_ST_Psi;
2467	MPI_Recv( x_l, LevS->MaxG*ElementSize, MPI_DOUBLE, RecvSource, HamiltonianTag, P->Par.comm_ST_PsiT, &status );
2468	} else { // .. otherwise setup wave function as x ...
2469	// Evaluate cross product: \epsilon_{ijm} (d_k - d_l)_j p_m \| \varphi^{(0)} \rangle = b_i ... and
2470	LPsiDatB=LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo];
2471	//LPsiDatx=LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo+Psi->TypeStartIndex[Perturbed_P0]];
2472	//CalculatePerturbationOperator_P(P,LPsiDatB,LPsiDatB_p0,cross(in,1),0);
2473	//CalculatePerturbationOperator_P(P,LPsiDatB,LPsiDatB_p1,cross(in,3),0);
2474	for (dex=0;dex<4;dex++)
2475	cross_lookup[dex] = cross(in,dex);
2476	for(s=0;s<LevS->MaxG;s++) {
2477	//if (x_l != x_l_bak \|\| s<0 \|\| s>LevS->MaxG) Error(SomeError,"FillDeltaCurrentDensity: x_l[] corrupted");
2478	factor =
2479	(MinImageConv(Lat,Psi->AddData[LOnePsiA->MyLocalNo].WannierCentre[cross_lookup[0]],
2480	Psi->AddData[LOnePsiB->MyLocalNo].WannierCentre[cross_lookup[0]],cross_lookup[0]) * LevS->GArray[s].G[cross_lookup[1]] -
2481	MinImageConv(Lat,Psi->AddData[LOnePsiA->MyLocalNo].WannierCentre[cross_lookup[2]],
2482	Psi->AddData[LOnePsiB->MyLocalNo].WannierCentre[cross_lookup[2]],cross_lookup[2]) * LevS->GArray[s].G[cross_lookup[3]]);
2483	x_l[s].re = factor * (-LPsiDatB[s].im); // switched due to factorization with "-i G"
2484	x_l[s].im = factor * (LPsiDatB[s].re);
2485	}
2486	// ... and send it to all other processes (Max_me... - 1)
2487	for (u=0;u<P->Par.Max_me_comm_ST_PsiT;u++)
2488	if (u != OnePsiB->my_color_comm_ST_Psi)
2489	MPI_Send( x_l, LevS->MaxG*ElementSize, MPI_DOUBLE, u, HamiltonianTag, P->Par.comm_ST_PsiT);
2490	} // x_l row is now filled (either by receiving result or evaluating it on its own)
2491	// Solve Ax = b by minimizing 1/2 xAx -xb (gradient is residual Ax - b) with conjugate gradient polak-ribiere
2492
2493	debug(P,"fill starting point x with values from b");
2494	/* Starting point, x = b */
2495	for (u=0;u<LevS->MaxG;u++) {
2496	gsl_vector_set (x, 2*u, x_l[u].re);
2497	gsl_vector_set (x, 2*u+1, x_l[u].im);
2498	}
2499
2500	gsl_multimin_fdfminimizer_set (minset, &my_func, x, 0.01, 1e-4);
2501
2502	fprintf(stderr,"(%i) Start solving for (%i,%i) and index %i\n",P->Par.me, k,l,in);
2503	// start solving
2504	iter = 0;
2505	do
2506	{
2507	iter++;
2508	Status = gsl_multimin_fdfminimizer_iterate (minset);
2509
2510	if (Status)
2511	break;
2512
2513	Status = gsl_multimin_test_gradient (minset->gradient, 1e-3);
2514
2515	if (Status == GSL_SUCCESS)
2516	fprintf (stderr,"(%i) Minimum found after %i iterations.\n", P->Par.me, iter);
2517
2518	} while (Status == GSL_CONTINUE && iter < 100);
2519
2520	debug(P,"Put solution into Psi1");
2521	// ... and what do we do now? Put solution into Psi1!
2522	for(s=0;s<LevS->MaxG;s++) {
2523	//if (Psi1 != (fftw_complex *) Dens0->DensityCArray[Temp2Density] \|\| s<0 \|\| s>LevS->MaxG) Error(SomeError,"FillDeltaCurrentDensity: Psi1 corrupted");
2524	Psi1[s].re = gsl_vector_get (minset->x, 2*s);
2525	Psi1[s].im = gsl_vector_get (minset->x, 2*s+1);
2526	}
2527
2528	// // Solve A^{-1} b_i = x
2529	// for(s=0;s<LevS->MaxG;s++) {
2530	// // REAL PART
2531	// // retrieve column from gathered matrix
2532	// for(u=0;u<Num;u++)
2533	// gsl_vector_set(x,u,x_l[u][s].re);
2534	//
2535	// // solve: sum_l A_{kl}^(-1) b_l (s) = x_k (s)
2536	// gsl_linalg_LU_svx (G, p, x);
2537	//
2538	// // put solution back into x_l[s]
2539	// for(u=0;u<Num;u++) {
2540	// //if (x_l != x_l_bak \|\| s<0 \|\| s>=LevS->MaxG) Error(SomeError,"FillDeltaCurrentDensity: x_l[] corrupted");
2541	// x_l[u][s].re = gsl_vector_get(x,u);
2542	// }
2543	//
2544	// // IMAGINARY PART
2545	// // retrieve column from gathered matrix
2546	// for(u=0;u<Num;u++)
2547	// gsl_vector_set(x,u,x_l[u][s].im);
2548	//
2549	// // solve: sum_l A_{kl}^(-1) b_l (s) = x_k (s)
2550	// gsl_linalg_LU_svx (G, p, x);
2551	//
2552	// // put solution back into x_l[s]
2553	// for(u=0;u<Num;u++) {
2554	// //if (x_l != x_l_bak \|\| s<0 \|\| s>=LevS->MaxG) Error(SomeError,"FillDeltaCurrentDensity: x_l[] corrupted");
2555	// x_l[u][s].im = gsl_vector_get(x,u);
2556	// }
2557	// } // now we have in x_l a vector similar to "Psi1" which we use to evaluate the current density
2558	//
2559	// // evaluate \Delta J_k ... mind the minus sign from G_kl!
2560	// // fill Psi1
2561	// for(s=0;s<LevS->MaxG;s++) {
2562	// //if (Psi1 != (fftw_complex *) Dens0->DensityCArray[Temp2Density] \|\| s<0 \|\| s>LevS->MaxG) Error(SomeError,"FillDeltaCurrentDensity: Psi1 corrupted");
2563	// Psi1[s].re = x_l[k][s].re;
2564	// Psi1[s].im = x_l[k][s].im;
2565	// }
2566
2567	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Bringing \|Psi1> one level up and fftransforming\n", P->Par.me);
2568	//if (Psi1R != (fftw_real *)Dens0->DensityArray[GapUpDensity]) Error(SomeError,"FillDeltaCurrentDensity: Psi1R corrupted");
2569	fft_Psi(P,Psi1,Psi1R, 0, Psi1symmetry); //2 // 0 //0
2570
2571	for (index=0;index<NDIM;index++) { // for all NDIM components of momentum operator
2572
2573	if ((P->Call.out[StepLeaderOut]) && (!index)) fprintf(stderr,"(%i) Bringing p\|Psi0> one level up and fftransforming\n", P->Par.me);
2574	//if (Psip0R != (fftw_real *)Dens0->DensityArray[GapLocalDensity]) Error(SomeError,"FillDeltaCurrentDensity: Psip0R corrupted");
2575	fft_Psi(P,Psi0,Psip0R, index, Psip0symmetry); //6 //6 //6
2576
2577	if ((P->Call.out[StepLeaderOut]) && (!index)) fprintf(stderr,"(%i) Bringing p\|Psi1> one level up and fftransforming\n", P->Par.me);
2578	//if (Psip1R != (fftw_real *)Dens0->DensityArray[GapDownDensity]) Error(SomeError,"FillDeltaCurrentDensity: Psip1R corrupted");
2579	fft_Psi(P,Psi1,Psip1R, index, Psip1symmetry); //4 //6 //6
2580
2581	// then for every point on the grid in real space ...
2582	for (n0=0;n0<N0;n0++) // only local points on x axis
2583	for (n[1]=0;n[1]<N[1];n[1]++)
2584	for (n[2]=0;n[2]<N[2];n[2]++) {
2585	i0 = n[2]+N[2](n[1]+N[1]n0);
2586	// and take the product
2587	Current = (Psip0R[i0] * Psi1R[i0] + Psi0R[i0] * Psip1R[i0]);
2588	Current = 0.5 UnitsFactor * Psi->AllPsiStatus[OnePsiA->MyGlobalNo].PsiFactor * R->FactorDensityR;
2589	////if (CurrentDensity[index+inNDIM] != (fftw_real ) Dens0->DensityArray[CurrentDensity0 + index+in*NDIM]) Error(SomeError,"FillCurrentDensity: CurrentDensity[] corrupted");
2590	//if (i0<0 \|\| i0>=Dens0->LocalSizeR) Error(SomeError,"FillDeltaCurrentDensity: i0 out of range");
2591	//if ((index+inNDIM)<0 \|\| (index+inNDIM)>=NDIM*NDIM) Error(SomeError,"FillDeltaCurrentDensity: index out of range");
2592	CurrentDensity[index+in*NDIM][i0] += Current; // minus sign is from G_kl
2593	}
2594	}
2595	}
2596	}
2597	}
2598	}
2599	}
2600	}
2601	}
2602	UnLockDensityArray(Dens0,GapDensity,real); // Psi0R
2603	UnLockDensityArray(Dens0,GapLocalDensity,real); // Psip0R
2604	UnLockDensityArray(Dens0,Temp2Density,imag); // Psi1
2605	UnLockDensityArray(Dens0,GapUpDensity,real); // Psi1R
2606	UnLockDensityArray(Dens0,GapDownDensity,real); // Psip1R
2607	// for (i=0;i<Num;i++)
2608	// if (x_l[i] != NULL) Free(x_l[i], "bla", "bla");
2609	// Free(x_l, "bla");
2610	gsl_multimin_fdfminimizer_free (minset);
2611	gsl_vector_free (x);
2612	// gsl_matrix_free(G);
2613	// gsl_permutation_free(p);
2614	// gsl_vector_free(x);
2615	}
2616
2617
2618	/** Evaluates the overlap integral between \a state wave functions.
2619	* \f[
2620	* S_{kl} = \langle \varphi_k^{(1)} \| \varphi_l^{(1)} \rangle
2621	* \f]
2622	* The scalar product is calculated via GradSP(), MPI_Allreduced among comm_ST_Psi and the result
2623	* stored in Psis#Overlap. The rows have to be MPI exchanged, as otherwise processes will add
2624	* to the TotalEnergy overlaps calculated with old wave functions - they have been minimised after
2625	* the product with exchanged coefficients was taken.
2626	* \param *P Problem at hand
2627	* \param l local number of perturbed wave function.
2628	* \param state PsiTypeTag minimisation state of wave functions to be overlapped
2629	*/
2630	void CalculateOverlap(struct Problem *P, const int l, const enum PsiTypeTag state)
2631	{
2632	struct RunStruct *R = &P->R;
2633	struct Lattice *Lat = &(P->Lat);
2634	struct Psis *Psi = &Lat->Psi;
2635	struct LatticeLevel *LevS = R->LevS;
2636	struct OnePsiElement OnePsiB, LOnePsiB;
2637	fftw_complex LPsiDatB=NULL, LPsiDatA=NULL;
2638	const int ElementSize = (sizeof(fftw_complex) / sizeof(double));
2639	int RecvSource;
2640	MPI_Status status;
2641	int i,j,m,p;
2642	//const int l_normal = l - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[Occupied];
2643	const int ActNum = l - Psi->TypeStartIndex[state] + Psi->TypeStartIndex[1] * Psi->LocalPsiStatus[l].my_color_comm_ST_Psi;
2644	double sendbuf, recvbuf;
2645	double tmp,TMP;
2646	const int gsize = P->Par.Max_me_comm_ST_PsiT; //number of processes in PsiT
2647	int p_num; // number of wave functions (for overlap)
2648
2649	// update overlap table after wave function has changed
2650	LPsiDatA = LevS->LPsi->LocalPsi[l];
2651	m = -1; // to access U matrix element (0..Num-1)
2652	for (j=0; j < Psi->MaxPsiOfType+P->Par.Max_me_comm_ST_PsiT; j++) { // go through all wave functions
2653	OnePsiB = &Psi->AllPsiStatus[j]; // grab OnePsiB
2654	if (OnePsiB->PsiType == state) { // drop all but the ones of current min state
2655	m++; // increase m if it is non-extra wave function
2656	if (OnePsiB->my_color_comm_ST_Psi == P->Par.my_color_comm_ST_Psi) // local?
2657	LOnePsiB = &Psi->LocalPsiStatus[OnePsiB->MyLocalNo];
2658	else
2659	LOnePsiB = NULL;
2660	if (LOnePsiB == NULL) { // if it's not local ... receive it from respective process into TempPsi
2661	RecvSource = OnePsiB->my_color_comm_ST_Psi;
2662	MPI_Recv( LevS->LPsi->TempPsi, LevS->MaxG*ElementSize, MPI_DOUBLE, RecvSource, OverlapTag, P->Par.comm_ST_PsiT, &status );
2663	LPsiDatB=LevS->LPsi->TempPsi;
2664	} else { // .. otherwise send it to all other processes (Max_me... - 1)
2665	for (p=0;p<P->Par.Max_me_comm_ST_PsiT;p++)
2666	if (p != OnePsiB->my_color_comm_ST_Psi)
2667	MPI_Send( LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo], LevS->MaxG*ElementSize, MPI_DOUBLE, p, OverlapTag, P->Par.comm_ST_PsiT);
2668	LPsiDatB=LevS->LPsi->LocalPsi[OnePsiB->MyLocalNo];
2669	} // LPsiDatB is now set to the coefficients of OnePsi either stored or MPI_Received
2670
2671	tmp = GradSP(P, LevS, LPsiDatA, LPsiDatB) * sqrt(Psi->LocalPsiStatus[l].PsiFactor * OnePsiB->PsiFactor);
2672	MPI_Allreduce ( &tmp, &TMP, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi);
2673	//fprintf(stderr,"(%i) Setting Overlap [%i][%i] = %lg\n",P->Par.me, ActNum,m,TMP);
2674	Psi->Overlap[ActNum][m] = TMP; //= Psi->Overlap[m][ActNum]
2675	}
2676	}
2677
2678	// exchange newly calculated rows among PsiT
2679	p_num = (m+1) + 1; // number of Psis: one more due to ActNum
2680	sendbuf = (double ) Malloc(p_num sizeof(double), "CalculateOverlap: sendbuf");
2681	sendbuf[0] = ActNum; // first entry is the global row number
2682	for (i=1;i<p_num;i++)
2683	sendbuf[i] = Psi->Overlap[ActNum][i-1]; // then follow up each entry of overlap row
2684	recvbuf = (double ) Malloc(gsize p_num * sizeof(double), "CalculateOverlap: recvbuf");
2685	MPI_Allgather(sendbuf, p_num, MPI_DOUBLE, recvbuf, p_num, MPI_DOUBLE, P->Par.comm_ST_PsiT);
2686	Free(sendbuf, "bla");
2687	for (i=0;i<gsize;i++) {// extract results from other processes out of receiving buffer
2688	m = recvbuf[i*p_num]; // m is ActNum of the process whose results we've just received
2689	//fprintf(stderr,"(%i) Received row %i from process %i\n", P->Par.me, m, i);
2690	for (j=1;j<p_num;j++)
2691	Psi->Overlap[m][j-1] = Psi->Overlap[j-1][m] = recvbuf[i*p_num+j]; // put each entry into correspondent Overlap row
2692	}
2693	Free(recvbuf, "bla");
2694	}
2695
2696
2697	/** Calculates magnetic susceptibility from known current density.
2698	* The bulk susceptibility tensor can be expressed as a function of the current density.
2699	* \f[
2700	* \chi_{ij} = \frac{\mu_0}{2\Omega} \frac{\delta}{\delta B_i^{ext}} \int_\Omega d^3 r \left (r \times j(r) \right )_j
2701	* \f]
2702	* Thus the integral over real space and subsequent MPI_Allreduce() over results from ParallelSimulationData#comm_ST_Psi is
2703	* straightforward. Tensor is diagonalized afterwards and split into its various sub-tensors of lower rank (e.g., isometric
2704	* value is tensor of rank 0) which are printed to screen and the tensorial elements to file '....chi.csv'
2705	* \param *P Problem at hand
2706	*/
2707	void CalculateMagneticSusceptibility(struct Problem *P)
2708	{
2709	struct RunStruct *R = &P->R;
2710	struct Lattice *Lat = &P->Lat;
2711	struct LatticeLevel *Lev0 = R->Lev0;
2712	struct Density *Dens0 = R->Lev0->Dens;
2713	struct Ions *I = &P->Ion;
2714	fftw_real CurrentDensity[NDIMNDIM];
2715	int in, dex, i, i0, n0;
2716	int n[NDIM];
2717	const int N0 = Lev0->Plan0.plan->local_nx;
2718	int N[NDIM];
2719	N[0] = Lev0->Plan0.plan->N[0];
2720	N[1] = Lev0->Plan0.plan->N[1];
2721	N[2] = Lev0->Plan0.plan->N[2];
2722	double chi[NDIMNDIM],Chi[NDIMNDIM], x[NDIM], fac[NDIM];
2723	const double discrete_factor = Lat->Volume/Lev0->MaxN;
2724	const int myPE = P->Par.me_comm_ST_Psi;
2725	double eta, delta_chi, S, A, iso;
2726	int cross_lookup[4];
2727	char filename[256];
2728	FILE *ChiFile;
2729	time_t seconds;
2730	time(&seconds); // get current time
2731
2732	// set pointers onto current density
2733	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
2734	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
2735	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
2736	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
2737	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
2738	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
2739	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
2740	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
2741	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
2742	//for(i=0;i<NDIM;i++) {
2743	// field[i] = Dens0->DensityArray[TempDensity+i];
2744	//LockDensityArray(Dens0,TempDensity+i,real);
2745	// SetArrayToDouble0((double )field[i],Dens0->TotalSize2);
2746	//}
2747	gsl_matrix_complex *H = gsl_matrix_complex_calloc(NDIM,NDIM);
2748
2749
2750	if (P->Call.out[ValueOut]) fprintf(stderr,"(%i) magnetic susceptibility tensor \\Chi_ij = \n",P->Par.me);
2751	for (in=0; in<NDIM; in++) { // index i of integrand vector component
2752	for(dex=0;dex<4;dex++) // initialise cross lookup
2753	cross_lookup[dex] = cross(in,dex);
2754	for (dex=0; dex<NDIM; dex++) { // index j of derivation wrt B field
2755	chi[in+dex*NDIM] = 0.;
2756	// do the integration over real space
2757	for(n0=0;n0<N0;n0++)
2758	for(n[1]=0;n[1]<N[1];n[1]++)
2759	for(n[2]=0;n[2]<N[2];n[2]++) {
2760	n[0]=n0 + N0*myPE; // global relative coordinate: due to partitoning of x-axis in PEPGamma>1 case
2761	fac[0] = (double)(n[0])/(double)N[0];
2762	fac[1] = (double)(n[1])/(double)N[1];
2763	fac[2] = (double)(n[2])/(double)N[2];
2764	RMat33Vec3(x, Lat->RealBasis, fac);
2765	i0 = n[2]+N[2](n[1]+N[1](n0)); // the index of current density must match LocalSizeR!
2766	chi[in+dexNDIM] += MinImageConv(Lat,x[cross_lookup[0]], sqrt(Lat->RealBasisSQ[cross_lookup[0]])/2.,cross_lookup[0]) CurrentDensity[dex*NDIM+cross_lookup[1]][i0]; // x[cross(in,0)], sqrt(Lat->RealBasisSQ[cross_lookup[0]])/2.
2767	chi[in+dexNDIM] -= MinImageConv(Lat,x[cross_lookup[2]], sqrt(Lat->RealBasisSQ[cross_lookup[2]])/2.,cross_lookup[2]) CurrentDensity[dex*NDIM+cross_lookup[3]][i0]; // x[cross(in,2)], sqrt(Lat->RealBasisSQ[cross_lookup[2]])/2.
2768	// if (in == dex) field[in][i0] =
2769	// truedist(Lat,x[cross_lookup[0]], sqrt(Lat->RealBasisSQ[c[0]])/2.,cross_lookup[0]) * CurrentDensity[dex*NDIM+cross_lookup[1]][i0]
2770	// - truedist(Lat,x[cross_lookup[2]], sqrt(Lat->RealBasisSQ[c[2]])/2.,cross_lookup[2]) * CurrentDensity[dex*NDIM+cross_lookup[3]][i0];
2771	//fprintf(stderr,"(%i) temporary susceptiblity \\chi[%i][%i] += %e * %e = r[%i] * CurrDens[%i][%i] = %e\n",P->Par.me,in,dex,(double)n[cross_lookup[0]]/(double)N[cross_lookup[0]](sqrt(Lat->RealBasisSQ[cross_lookup[0]])),CurrentDensity[dexNDIM+cross_lookup[1]][i0],cross_lookup[0],dexNDIM+cross_lookup[1],i0,chi[inNDIM+dex]);
2772	}
2773	chi[in+dexNDIM] = mu0discrete_factor/(2.Lat->Volume); // integral factor
2774	chi[in+dexNDIM] = (-1625.); // empirical gauge factor ... sigh
2775	MPI_Allreduce ( &chi[in+dexNDIM], &Chi[in+dexNDIM], 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum "LocalSize to TotalSize"
2776	I->I[0].chi[in+dexNDIM] = Chi[in+dexNDIM];
2777	Chi[in+dexNDIM] = Lat->Volume*loschmidt_constant; // factor for _molar_ susceptibility
2778	if (P->Call.out[ValueOut]) {
2779	fprintf(stderr,"%e\t", Chi[in+dex*NDIM]);
2780	if (dex == NDIM-1) fprintf(stderr,"\n");
2781	}
2782	}
2783	}
2784	// store symmetrized matrix
2785	for (in=0;in<NDIM;in++)
2786	for (dex=0;dex<NDIM;dex++)
2787	gsl_matrix_complex_set(H,in,dex,gsl_complex_rect((Chi[in+dexNDIM]+Chi[dex+inNDIM])/2.,0));
2788	// output tensor to file
2789	if (P->Par.me == 0) {
2790	sprintf(filename, ".chi.L%i.csv", Lev0->LevelNo);
2791	OpenFile(P, &ChiFile, filename, "a", P->Call.out[ReadOut]);
2792	fprintf(ChiFile,"# magnetic susceptibility tensor chi[01,02,03,10,11,12,20,21,22], seed %i, config %s, run on %s", R->Seed, P->Files.default_path, ctime(&seconds));
2793	fprintf(ChiFile,"%lg\t", P->Lat.ECut/(Lat->LevelSizes[0]*Lat->LevelSizes[0]));
2794	for (in=0;in<NDIM*NDIM;in++)
2795	fprintf(ChiFile,"%e\t", Chi[in]);
2796	fprintf(ChiFile,"\n");
2797	fclose(ChiFile);
2798	}
2799	// diagonalize chi
2800	gsl_vector *eval = gsl_vector_alloc(NDIM);
2801	gsl_eigen_herm_workspace *w = gsl_eigen_herm_alloc(NDIM);
2802	gsl_eigen_herm(H, eval, w);
2803	gsl_eigen_herm_free(w);
2804	gsl_sort_vector(eval); // sort eigenvalues
2805	// print eigenvalues
2806	iso = 0;
2807	for (i=0;i<NDIM;i++) {
2808	I->I[0].chi_PAS[i] = gsl_vector_get(eval,i);
2809	iso += Chi[i+i*NDIM]/3.;
2810	}
2811	eta = (gsl_vector_get(eval,1)-gsl_vector_get(eval,0))/(gsl_vector_get(eval,2)-iso);
2812	delta_chi = gsl_vector_get(eval,2) - 0.5*(gsl_vector_get(eval,0)+gsl_vector_get(eval,1));
2813	S = (delta_chidelta_chi)(1+1./3.etaeta);
2814	A = 0.;
2815	for (i=0;i<NDIM;i++) {
2816	in = cross(i,0);
2817	dex = cross(i,1);
2818	A += pow(-1,i)pow(0.5(Chi[in+dexNDIM]-Chi[dex+inNDIM]),2);
2819	}
2820	if (P->Call.out[ValueOut]) {
2821	fprintf(stderr,"(%i) converted to Principal Axis System\n==================\nDiagonal entries:", P->Par.me);
2822	for (i=0;i<NDIM;i++)
2823	fprintf(stderr,"\t%lg",gsl_vector_get(eval,i));
2824	fprintf(stderr,"\nsusceptib. : %e\n", iso);
2825	fprintf(stderr,"anisotropy : %e\n", delta_chi);
2826	fprintf(stderr,"asymmetry : %e\n", eta);
2827	fprintf(stderr,"S : %e\n", S);
2828	fprintf(stderr,"A : %e\n", A);
2829	fprintf(stderr,"==================\n");
2830	}
2831	//for(i=0;i<NDIM;i++)
2832	//UnLockDensityArray(Dens0,TempDensity+i,real);
2833	gsl_vector_free(eval);
2834	gsl_matrix_complex_free(H);
2835	}
2836
2837	/** Fouriertransforms all nine current density components and calculates shielding tensor.
2838	* \f[
2839	* \sigma_{ij} = \left ( \frac{G}{\|G\|^2} \times J_i(G) \right )_j
2840	* \f]
2841	* The CurrentDensity has to be fouriertransformed to reciprocal subspace in order to be useful, and the final
2842	* product \f$\sigma_{ij}(G)\f$ has to be back-transformed to real space. However, the shielding is the only evaluated
2843	* at the grid points and not where the real ion position is. The shieldings there are interpolated between the eight
2844	* adjacent grid points by a simple linear weighting. Afterwards follows the same analaysis and printout of the rank-2-tensor
2845	* as in the case of CalculateMagneticShielding().
2846	* \param *P Problem at hand
2847	* \note Lots of arrays are used temporarily during the routine for the fft'ed Current density tensor.
2848	* \note MagneticSusceptibility is needed for G=0-component and thus has to be computed beforehand
2849	*/
2850	void CalculateChemicalShieldingByReciprocalCurrentDensity(struct Problem *P)
2851	{
2852	struct RunStruct *R = &P->R;
2853	struct Lattice *Lat = &P->Lat;
2854	struct LatticeLevel *Lev0 = R->Lev0;
2855	struct Ions *I = &P->Ion;
2856	struct Density *Dens0 = Lev0->Dens;
2857	struct OneGData *GArray = Lev0->GArray;
2858	struct fft_plan_3d *plan = Lat->plan;
2859	fftw_real CurrentDensity[NDIMNDIM];
2860	fftw_complex CurrentDensityC[NDIMNDIM];
2861	fftw_complex work = (fftw_complex )Dens0->DensityCArray[TempDensity];
2862	//fftw_complex sigma_imag = (fftw_complex )Dens0->DensityCArray[Temp2Density];
2863	//fftw_real sigma_real = (fftw_real )sigma_imag;
2864	fftw_complex *sigma_imag[NDIM_NDIM];
2865	fftw_real *sigma_real[NDIM_NDIM];
2866	double sigma,Sigma;
2867	int it, ion, in, dex, g, n[2][NDIM], Index, i;
2868	//const double FFTfactor = 1.;///Lev0->MaxN;
2869	double eta, delta_sigma, S, A, iso, tmp;
2870	FILE *SigmaFile;
2871	char suffixsigma[255];
2872	double x[2][NDIM];
2873	const int myPE = P->Par.me_comm_ST_Psi;
2874	int N[NDIM];
2875	int cross_lookup[4]; // cross lookup table
2876	N[0] = Lev0->Plan0.plan->N[0];
2877	N[1] = Lev0->Plan0.plan->N[1];
2878	N[2] = Lev0->Plan0.plan->N[2];
2879	const int N0 = Lev0->Plan0.plan->local_nx;
2880	const double factorDC = R->FactorDensityC;
2881	gsl_matrix_complex *H = gsl_matrix_complex_calloc(NDIM,NDIM);
2882
2883	time_t seconds;
2884	time(&seconds); // get current time
2885
2886	// inverse Fourier transform current densities
2887	CurrentDensityC[0] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity0];
2888	CurrentDensityC[1] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity1];
2889	CurrentDensityC[2] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity2];
2890	CurrentDensityC[3] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity3];
2891	CurrentDensityC[4] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity4];
2892	CurrentDensityC[5] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity5];
2893	CurrentDensityC[6] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity6];
2894	CurrentDensityC[7] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity7];
2895	CurrentDensityC[8] = (fftw_complex *) Dens0->DensityCArray[CurrentDensity8];
2896	// don't put the following stuff into a for loop, they are not continuous! (preprocessor values CurrentDensity.)
2897	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
2898	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
2899	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
2900	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
2901	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
2902	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
2903	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
2904	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
2905	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
2906
2907	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Checking J_{ij} (G=0) = 0 for each i,j ... \n",P->Par.me);
2908	for (in=0;in<NDIM*NDIM;in++) {
2909	CalculateOneDensityC(Lat, R->LevS, Dens0, CurrentDensity[in], CurrentDensityC[in], factorDC);
2910	tmp = sqrt(CurrentDensityC[in][0].reCurrentDensityC[in][0].re+CurrentDensityC[in][0].imCurrentDensityC[in][0].im);
2911	if (GArray[0].GSq < MYEPSILON) {
2912	if (in % NDIM == 0) fprintf(stderr,"(%i) ",P->Par.me);
2913	if (tmp > MYEPSILON) {
2914	fprintf(stderr,"J_{%i,%i} = \|%e + i%e\| < %e ? (%e)\t", in / NDIM, in%NDIM, CurrentDensityC[in][0].re, CurrentDensityC[in][0].im, MYEPSILON, tmp - MYEPSILON);
2915	} else {
2916	fprintf(stderr,"J_{%i,%i} ok\t", in / NDIM, in%NDIM);
2917	}
2918	if (in % NDIM == (NDIM-1)) fprintf(stderr,"\n");
2919	}
2920	}
2921
2922	for (in=0;in<NDIM*NDIM;in++) {
2923	LockDensityArray(Dens0,in,real); // Psi1R
2924	sigma_imag[in] = (fftw_complex *) Dens0->DensityArray[in];
2925	sigma_real[in] = (fftw_real *) sigma_imag[in];
2926	}
2927
2928	LockDensityArray(Dens0,TempDensity,imag); // work
2929	LockDensityArray(Dens0,Temp2Density,imag); // tempdestRC and field
2930	// go through reciprocal nodes and calculate shielding tensor sigma
2931	for (in=0; in<NDIM; in++) {// index i of vector component in integrand
2932	for(dex=0;dex<4;dex++) // initialise cross lookup
2933	cross_lookup[dex] = cross(in,dex);
2934	for (dex=0; dex<NDIM; dex++) { // index j of B component derivation in current density tensor
2935	//if (tempdestRC != (fftw_complex *)Dens0->DensityCArray[Temp2Density]) Error(SomeError,"CalculateChemicalShieldingByReciprocalCurrentDensity: tempdestRC corrupted");
2936	SetArrayToDouble0((double )sigma_imag[in+dexNDIM],Dens0->TotalSize*2);
2937	for (g=0; g < Lev0->MaxG; g++)
2938	if (GArray[g].GSq > MYEPSILON) { // skip due to divisor
2939	Index = GArray[g].Index; // re = im, im = -re due to "i" in formula
2940	//if (tempdestRC != (fftw_complex *)Dens0->DensityCArray[Temp2Density] \|\| Index<0 \|\| Index>=Dens0->LocalSizeC) Error(SomeError,"CalculateChemicalShieldingByReciprocalCurrentDensity: tempdestRC corrupted");
2941	sigma_imag[in+dexNDIM][Index].re = GArray[g].G[cross_lookup[0]] (-CurrentDensityC[dexNDIM+cross_lookup[1]][Index].im)/GArray[g].GSq;//FFTfactor;
2942	sigma_imag[in+dexNDIM][Index].re -= GArray[g].G[cross_lookup[2]] (-CurrentDensityC[dexNDIM+cross_lookup[3]][Index].im)/GArray[g].GSq;//FFTfactor;
2943	sigma_imag[in+dexNDIM][Index].im = GArray[g].G[cross_lookup[0]] ( CurrentDensityC[dexNDIM+cross_lookup[1]][Index].re)/GArray[g].GSq;//FFTfactor;
2944	sigma_imag[in+dexNDIM][Index].im -= GArray[g].G[cross_lookup[2]] ( CurrentDensityC[dexNDIM+cross_lookup[3]][Index].re)/GArray[g].GSq;//FFTfactor;
2945	} else { // G=0-component stems from magnetic susceptibility
2946	sigma_imag[in+dexNDIM][GArray[g].Index].re = 2./3.I->I[0].chi[in+dexNDIM];//-4.M_PI(0.5I->I[0].chi[0+0NDIM]+0.5I->I[0].chi[1+1NDIM]+2./3.I->I[0].chi[2+2*NDIM]);
2947	}
2948	for (g=0; g<Lev0->MaxDoubleG; g++) { // apply symmetry
2949	//if (tempdestRC != (fftw_complex )Dens0->DensityCArray[Temp2Density] \|\| Lev0->DoubleG[2g+1]<0 \|\| Lev0->DoubleG[2*g+1]>=Dens0->LocalSizeC) Error(SomeError,"CalculateChemicalShieldingByReciprocalCurrentDensity: tempdestRC corrupted");
2950	sigma_imag[in+dexNDIM][Lev0->DoubleG[2g+1]].re = sigma_imag[in+dexNDIM][Lev0->DoubleG[2g]].re;
2951	sigma_imag[in+dexNDIM][Lev0->DoubleG[2g+1]].im = -sigma_imag[in+dexNDIM][Lev0->DoubleG[2g]].im;
2952	}
2953	// fourier transformation of sigma
2954	//if (tempdestRC != (fftw_complex *)Dens0->DensityCArray[Temp2Density]) Error(SomeError,"CalculateChemicalShieldingByReciprocalCurrentDensity: tempdestRC corrupted");
2955	fft_3d_complex_to_real(plan, Lev0->LevelNo, FFTNF1, sigma_imag[in+dex*NDIM], work);
2956
2957	for (it=0; it < I->Max_Types; it++) { // integration over all types
2958	for (ion=0; ion < I->I[it].Max_IonsOfType; ion++) { // and each ion of type
2959	// read transformed sigma at core position and MPI_Allreduce
2960	for (g=0;g<NDIM;g++) {
2961	n[0][g] = floor(I->I[it].R[NDIMion+g]/sqrt(Lat->RealBasisSQ[g])(double)N[g]);
2962	n[1][g] = ceil(I->I[it].R[NDIMion+g]/sqrt(Lat->RealBasisSQ[g])(double)N[g]);
2963	x[1][g] = I->I[it].R[NDIMion+g]/sqrt(Lat->RealBasisSQ[g])(double)N[g] - (double)n[0][g];
2964	x[0][g] = 1. - x[1][g];
2965	//fprintf(stderr,"(%i) n_floor[%i] = %i\tn_ceil[%i] = %i --- x_floor[%i] = %e\tx_ceil[%i] = %e\n",P->Par.me, g,n[0][g], g,n[1][g], g,x[0][g], g,x[1][g]);
2966	}
2967	sigma = 0.;
2968	for (i=0;i<2;i++) { // interpolate linearly between adjacent grid points per axis
2969	if ((n[i][0] >= N0myPE) && (n[i][0] < N0(myPE+1))) {
2970	// fprintf(stderr,"(%i) field[%i]: sigma = %e\n", P->Par.me, n[i][2]+N[2](n[i][1]+N[1](n[i][0]-N0*myPE)), sigma);
2971	sigma += (x[i][0]x[0][1]x[0][2])sigma_real[in+dexNDIM][n[0][2]+N[2](n[0][1]+N[1](n[i][0]-N0myPE))]mu0; // if it's local and factor from inverse fft
2972	//fprintf(stderr,"(%i) field[%i]: sigma += %e * %e \n", P->Par.me, n[i][2]+N[2](n[i][1]+N[1](n[i][0]-N0myPE)), (x[i][0]x[0][1]x[0][2]), field[n[0][2]+N[2](n[0][1]+N[1](n[i][0]-N0myPE))]*mu0);
2973	sigma += (x[i][0]x[0][1]x[1][2])sigma_real[in+dexNDIM][n[1][2]+N[2](n[0][1]+N[1](n[i][0]-N0myPE))]mu0; // if it's local and factor from inverse fft
2974	//fprintf(stderr,"(%i) field[%i]: sigma += %e * %e \n", P->Par.me, n[i][2]+N[2](n[i][1]+N[1](n[i][0]-N0myPE)), (x[i][0]x[0][1]x[1][2]), field[n[1][2]+N[2](n[0][1]+N[1](n[i][0]-N0myPE))]*mu0);
2975	sigma += (x[i][0]x[1][1]x[0][2])sigma_real[in+dexNDIM][n[0][2]+N[2](n[1][1]+N[1](n[i][0]-N0myPE))]mu0; // if it's local and factor from inverse fft
2976	//fprintf(stderr,"(%i) field[%i]: sigma += %e * %e \n", P->Par.me, n[i][2]+N[2](n[i][1]+N[1](n[i][0]-N0myPE)), (x[i][0]x[1][1]x[0][2]), field[n[0][2]+N[2](n[1][1]+N[1](n[i][0]-N0myPE))]*mu0);
2977	sigma += (x[i][0]x[1][1]x[1][2])sigma_real[in+dexNDIM][n[1][2]+N[2](n[1][1]+N[1](n[i][0]-N0myPE))]mu0; // if it's local and factor from inverse fft
2978	//fprintf(stderr,"(%i) field[%i]: sigma += %e * %e \n", P->Par.me, n[i][2]+N[2](n[i][1]+N[1](n[i][0]-N0myPE)), (x[i][0]x[1][1]x[1][2]), field[n[1][2]+N[2](n[1][1]+N[1](n[i][0]-N0myPE))]*mu0);
2979	}
2980	}
2981	sigma *= -R->FactorDensityR; // factor from inverse fft? (and its defined as negative proportionaly factor)
2982	MPI_Allreduce ( &sigma, &Sigma, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum local to total
2983	I->I[it].sigma_rezi[ion][in+dex*NDIM] = Sigma;
2984	}
2985	}
2986	// fabs() all sigma values, as we need them as a positive density: OutputVis plots them in logarithmic scale and
2987	// thus cannot deal with negative values!
2988	for (i=0; i< Dens0->LocalSizeR; i++)
2989	sigma_real[in+dexNDIM][i] = fabs(sigma_real[in+dexNDIM][i]);
2990	}
2991	}
2992	UnLockDensityArray(Dens0,TempDensity,imag); // work
2993	UnLockDensityArray(Dens0,Temp2Density,imag); // tempdestRC and field
2994
2995	// output tensor to file
2996	if (P->Par.me == 0) {
2997	sprintf(&suffixsigma[0], ".sigma_chi_rezi.L%i.csv", Lev0->LevelNo);
2998	OpenFile(P, &SigmaFile, suffixsigma, "a", P->Call.out[ReadOut]);
2999	fprintf(SigmaFile,"# chemical shielding tensor sigma_rezi[01,02,03,10,11,12,20,21,22], seed %i, config %s, run on %s", R->Seed, P->Files.default_path, ctime(&seconds));
3000	fprintf(SigmaFile,"%lg\t", P->Lat.ECut/(Lat->LevelSizes[0]*Lat->LevelSizes[0]));
3001	for (in=0;in<NDIM;in++)
3002	for (dex=0;dex<NDIM;dex++)
3003	fprintf(SigmaFile,"%e\t", GSL_REAL(gsl_matrix_complex_get(H,in,dex)));
3004	fprintf(SigmaFile,"\n");
3005	fclose(SigmaFile);
3006	}
3007
3008	gsl_vector *eval = gsl_vector_alloc(NDIM);
3009	gsl_eigen_herm_workspace *w = gsl_eigen_herm_alloc(NDIM);
3010
3011	for (it=0; it < I->Max_Types; it++) { // integration over all types
3012	for (ion=0; ion < I->I[it].Max_IonsOfType; ion++) { // and each ion of type
3013	if (P->Call.out[ValueOut]) fprintf(stderr,"(%i) Shielding Tensor for Ion %i of element %s \\sigma_ij = \n",P->Par.me, ion, I->I[it].Name);
3014	for (in=0; in<NDIM; in++) { // index i of vector component in integrand
3015	for (dex=0; dex<NDIM; dex++) {// index j of B component derivation in current density tensor
3016	gsl_matrix_complex_set(H,in,dex,gsl_complex_rect((I->I[it].sigma_rezi[ion][in+dexNDIM]+I->I[it].sigma_rezi[ion][dex+inNDIM])/2.,0));
3017	if (P->Call.out[ValueOut]) fprintf(stderr,"%e\t", I->I[it].sigma_rezi[ion][in+dex*NDIM]);
3018	}
3019	if (P->Call.out[ValueOut]) fprintf(stderr,"\n");
3020	}
3021	// output tensor to file
3022	if (P->Par.me == 0) {
3023	sprintf(&suffixsigma[0], ".sigma_i%i_%s_rezi.L%i.csv", ion, I->I[it].Symbol, Lev0->LevelNo);
3024	OpenFile(P, &SigmaFile, suffixsigma, "a", P->Call.out[ReadOut]);
3025	fprintf(SigmaFile,"# chemical shielding tensor sigma_rezi[01,02,03,10,11,12,20,21,22], seed %i, config %s, run on %s", R->Seed, P->Files.default_path, ctime(&seconds));
3026	fprintf(SigmaFile,"%lg\t", P->Lat.ECut/(Lat->LevelSizes[0]*Lat->LevelSizes[0]));
3027	for (in=0;in<NDIM;in++)
3028	for (dex=0;dex<NDIM;dex++)
3029	fprintf(SigmaFile,"%e\t", I->I[it].sigma_rezi[ion][in+dex*NDIM]);
3030	fprintf(SigmaFile,"\n");
3031	fclose(SigmaFile);
3032	}
3033	// diagonalize sigma
3034	gsl_eigen_herm(H, eval, w);
3035	gsl_sort_vector(eval); // sort eigenvalues
3036	// print eigenvalues
3037	// if (P->Call.out[ValueOut]) {
3038	// fprintf(stderr,"(%i) diagonal shielding for Ion %i of element %s:", P->Par.me, ion, I->I[it].Name);
3039	// for (in=0;in<NDIM;in++)
3040	// fprintf(stderr,"\t%lg",gsl_vector_get(eval,in));
3041	// fprintf(stderr,"\n\n");
3042	// }
3043	iso = 0.;
3044	for (i=0;i<NDIM;i++) {
3045	I->I[it].sigma_rezi_PAS[ion][i] = gsl_vector_get(eval,i);
3046	iso += I->I[it].sigma_rezi[ion][i+i*NDIM]/3.;
3047	}
3048	eta = (gsl_vector_get(eval,1)-gsl_vector_get(eval,0))/(gsl_vector_get(eval,2)-iso);
3049	delta_sigma = gsl_vector_get(eval,2) - 0.5*(gsl_vector_get(eval,0)+gsl_vector_get(eval,1));
3050	S = (delta_sigmadelta_sigma)(1+1./3.etaeta);
3051	A = 0.;
3052	for (i=0;i<NDIM;i++) {
3053	in = cross(i,0);
3054	dex = cross(i,1);
3055	A += pow(-1,i)pow(0.5(I->I[it].sigma_rezi[ion][in+dexNDIM]-I->I[it].sigma_rezi[ion][dex+inNDIM]),2);
3056	}
3057	if (P->Call.out[ValueOut]) {
3058	fprintf(stderr,"(%i) converted to Principal Axis System\n==================\nDiagonal entries:", P->Par.me);
3059	for (i=0;i<NDIM;i++)
3060	fprintf(stderr,"\t%lg",gsl_vector_get(eval,i));
3061	fprintf(stderr,"\nshielding : %e\n", iso);
3062	fprintf(stderr,"anisotropy : %e\n", delta_sigma);
3063	fprintf(stderr,"asymmetry : %e\n", eta);
3064	fprintf(stderr,"S : %e\n", S);
3065	fprintf(stderr,"A : %e\n", A);
3066	fprintf(stderr,"==================\n");
3067
3068	}
3069	}
3070	}
3071
3072	// Output of magnetic field densities for each direction
3073	for (i=0;i<NDIM*NDIM;i++)
3074	OutputVis(P, sigma_real[i]);
3075	// Diagonalizing the tensor "field" B_ij [r]
3076	fprintf(stderr,"(%i) Diagonalizing B_ij [r] ... \n", P->Par.me);
3077	for (i=0; i< Dens0->LocalSizeR; i++) {
3078	for (in=0; in<NDIM; in++) // index i of vector component in integrand
3079	for (dex=0; dex<NDIM; dex++) { // index j of B component derivation in current density tensor
3080	//fprintf(stderr,"(%i) Setting B_(%i,%i)[%i] ... \n", P->Par.me, in,dex,i);
3081	gsl_matrix_complex_set(H,in,dex,gsl_complex_rect((sigma_real[in+dexNDIM][i]+sigma_real[dex+inNDIM][i])/2.,0));
3082	}
3083	gsl_eigen_herm(H, eval, w);
3084	gsl_sort_vector(eval); // sort eigenvalues
3085	for (in=0;in<NDIM;in++)
3086	sigma_real[in][i] = gsl_vector_get(eval,in);
3087	}
3088	// Output of diagonalized magnetic field densities for each direction
3089	for (i=0;i<NDIM;i++)
3090	OutputVis(P, sigma_real[i]);
3091	for (i=0;i<NDIM*NDIM;i++)
3092	UnLockDensityArray(Dens0,i,real); // sigma_imag/real free
3093
3094	gsl_eigen_herm_free(w);
3095	gsl_vector_free(eval);
3096	gsl_matrix_complex_free(H);
3097	}
3098
3099
3100	/** Calculates the chemical shielding tensor at the positions of the nuclei.
3101	* The chemical shielding tensor at position R is defined as the proportionality factor between the induced and
3102	* the externally applied field.
3103	* \f[
3104	* \sigma_{ij} (R) = \frac{\delta B_j^{ind} (R)}{\delta B_i^{ext}}
3105	* = \frac{\mu_0}{4 \pi} \int d^3 r' \left ( \frac{r'-r}{\| r' - r \|^3} \times J_i (r') \right )_j
3106	* \f]
3107	* One after another for each nuclear position is the tensor evaluated and the result printed
3108	* to screen. Tensor is diagonalized afterwards.
3109	* \param *P Problem at hand
3110	* \sa CalculateMagneticSusceptibility() - similar calculation, yet without translation to ion centers.
3111	* \warning This routine is out-dated due to being numerically unstable because of the singularity which is not
3112	* considered carefully, recommendend replacement is CalculateChemicalShieldingByReciprocalCurrentDensity().
3113	*/
3114	void CalculateChemicalShielding(struct Problem *P)
3115	{
3116	struct RunStruct *R = &P->R;
3117	struct Lattice *Lat = &P->Lat;
3118	struct LatticeLevel *Lev0 = R->Lev0;
3119	struct Density *Dens0 = R->Lev0->Dens;
3120	struct Ions *I = &P->Ion;
3121	double sigma[NDIMNDIM],Sigma[NDIMNDIM];
3122	fftw_real CurrentDensity[NDIMNDIM];
3123	int it, ion, in, dex, i0, n[NDIM], n0, i;//, *NUp;
3124	double x,y,z;
3125	double dist;
3126	double r[NDIM], fac[NDIM];
3127	const double discrete_factor = Lat->Volume/Lev0->MaxN;
3128	double eta, delta_sigma, S, A, iso;
3129	const int myPE = P->Par.me_comm_ST_Psi;
3130	int N[NDIM];
3131	N[0] = Lev0->Plan0.plan->N[0];
3132	N[1] = Lev0->Plan0.plan->N[1];
3133	N[2] = Lev0->Plan0.plan->N[2];
3134	const int N0 = Lev0->Plan0.plan->local_nx;
3135	FILE *SigmaFile;
3136	char suffixsigma[255];
3137	time_t seconds;
3138	time(&seconds); // get current time
3139
3140	// set pointers onto current density
3141	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
3142	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
3143	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
3144	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
3145	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
3146	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
3147	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
3148	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
3149	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
3150	gsl_matrix_complex *H = gsl_matrix_complex_calloc(NDIM,NDIM);
3151
3152	for (it=0; it < I->Max_Types; it++) { // integration over all types
3153	for (ion=0; ion < I->I[it].Max_IonsOfType; ion++) { // and each ion of type
3154	if (P->Call.out[ValueOut]) fprintf(stderr,"(%i) Shielding Tensor for Ion %i of element %s \\sigma_ij = \n",P->Par.me, ion, I->I[it].Name);
3155	for (in=0; in<NDIM; in++) {// index i of vector component in integrand
3156	for (dex=0; dex<NDIM; dex++) { // index j of B component derivation in current density tensor
3157	sigma[in+dex*NDIM] = 0.;
3158
3159	for(n0=0;n0<N0;n0++) // do the integration over real space
3160	for(n[1]=0;n[1]<N[1];n[1]++)
3161	for(n[2]=0;n[2]<N[2];n[2]++) {
3162	n[0]=n0 + N0*myPE; // global relative coordinate: due to partitoning of x-axis in PEPGamma>1 case
3163	fac[0] = (double)n[0]/(double)N[0];
3164	fac[1] = (double)n[1]/(double)N[1];
3165	fac[2] = (double)n[2]/(double)N[2];
3166	RMat33Vec3(r, Lat->RealBasis, fac);
3167	i0 = n[2]+N[2](n[1]+N[1](n0)); // the index of current density must match LocalSizeR!
3168	x = MinImageConv(Lat,r[cross(in,0)], I->I[it].R[NDIM*ion+cross(in,0)],cross(in,0));
3169	y = MinImageConv(Lat,r[cross(in,2)], I->I[it].R[NDIM*ion+cross(in,2)],cross(in,2));
3170	z = MinImageConv(Lat,r[in], I->I[it].R[NDIM*ion+in],in); // "in" always is missing third component in cross product
3171	dist = pow(xx + yy + z*z, 3./2.);
3172	if ((dist < pow(2.,3.)) && (dist > MYEPSILON)) sigma[in+dexNDIM] += (x CurrentDensity[dexNDIM+cross(in,1)][i0] - y CurrentDensity[dex*NDIM+cross(in,3)][i0])/dist;
3173	//if (it == 0 && ion == 0) fprintf(stderr,"(%i) sigma[%i][%i] += (%e * %e - %e * %e)/%e = %e\n", P->Par.me, in, dex, x,CurrentDensity[dexNDIM+cross(in,1)][i0],y,CurrentDensity[dexNDIM+cross(in,3)][i0],dist,sigma[in+dex*NDIM]);
3174	}
3175	sigma[in+dexNDIM] = -mu0discrete_factor/(4.PI); // due to summation instead of integration
3176	MPI_Allreduce ( &sigma[in+dexNDIM], &Sigma[in+dexNDIM], 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum "LocalSize to TotalSize"
3177	I->I[it].sigma[ion][in+dexNDIM] = Sigma[in+dexNDIM];
3178	if (P->Call.out[ValueOut]) fprintf(stderr," %e", Sigma[in+dex*NDIM]);
3179	}
3180	if (P->Call.out[ValueOut]) fprintf(stderr,"\n");
3181	}
3182	// store symmetrized matrix
3183	for (in=0;in<NDIM;in++)
3184	for (dex=0;dex<NDIM;dex++)
3185	gsl_matrix_complex_set(H,in,dex,gsl_complex_rect((Sigma[in+dexNDIM]+Sigma[dex+inNDIM])/2.,0));
3186	// output tensor to file
3187	if (P->Par.me == 0) {
3188	sprintf(&suffixsigma[0], ".sigma_i%i_%s.L%i.csv", ion, I->I[it].Symbol, Lev0->LevelNo);
3189	OpenFile(P, &SigmaFile, suffixsigma, "a", P->Call.out[ReadOut]);
3190	fprintf(SigmaFile,"# chemical shielding tensor sigma[01,02,03,10,11,12,20,21,22], seed %i, config %s, run on %s", R->Seed, P->Files.default_path, ctime(&seconds));
3191	fprintf(SigmaFile,"%lg\t", P->Lat.ECut/(Lat->LevelSizes[0]*Lat->LevelSizes[0]));
3192	for (in=0;in<NDIM*NDIM;in++)
3193	fprintf(SigmaFile,"%e\t", Sigma[in]);
3194	fprintf(SigmaFile,"\n");
3195	fclose(SigmaFile);
3196	}
3197	// diagonalize sigma
3198	gsl_vector *eval = gsl_vector_alloc(NDIM);
3199	gsl_eigen_herm_workspace *w = gsl_eigen_herm_alloc(NDIM);
3200	gsl_eigen_herm(H, eval, w);
3201	gsl_eigen_herm_free(w);
3202	gsl_sort_vector(eval); // sort eigenvalues
3203	// print eigenvalues
3204	// if (P->Call.out[ValueOut]) {
3205	// fprintf(stderr,"(%i) diagonal shielding for Ion %i of element %s:", P->Par.me, ion, I->I[it].Name);
3206	// for (in=0;in<NDIM;in++)
3207	// fprintf(stderr,"\t%lg",gsl_vector_get(eval,in));
3208	// fprintf(stderr,"\n\n");
3209	// }
3210	// print eigenvalues
3211	iso = 0;
3212	for (i=0;i<NDIM;i++) {
3213	I->I[it].sigma[ion][i] = gsl_vector_get(eval,i);
3214	iso += Sigma[i+i*NDIM]/3.;
3215	}
3216	eta = (gsl_vector_get(eval,1)-gsl_vector_get(eval,0))/(gsl_vector_get(eval,2)-iso);
3217	delta_sigma = gsl_vector_get(eval,2) - 0.5*(gsl_vector_get(eval,0)+gsl_vector_get(eval,1));
3218	S = (delta_sigmadelta_sigma)(1+1./3.etaeta);
3219	A = 0.;
3220	for (i=0;i<NDIM;i++) {
3221	in = cross(i,0);
3222	dex = cross(i,1);
3223	A += pow(-1,i)pow(0.5(Sigma[in+dexNDIM]-Sigma[dex+inNDIM]),2);
3224	}
3225	if (P->Call.out[ValueOut]) {
3226	fprintf(stderr,"(%i) converted to Principal Axis System\n==================\nDiagonal entries:", P->Par.me);
3227	for (i=0;i<NDIM;i++)
3228	fprintf(stderr,"\t%lg",gsl_vector_get(eval,i));
3229	fprintf(stderr,"\nshielding : %e\n", iso);
3230	fprintf(stderr,"anisotropy : %e\n", delta_sigma);
3231	fprintf(stderr,"asymmetry : %e\n", eta);
3232	fprintf(stderr,"S : %e\n", S);
3233	fprintf(stderr,"A : %e\n", A);
3234	fprintf(stderr,"==================\n");
3235
3236	}
3237	gsl_vector_free(eval);
3238	}
3239	}
3240
3241	gsl_matrix_complex_free(H);
3242	}
3243
3244	/** Test if integrated current over cell is 0.
3245	* In most cases we do not reach a numerical sensible zero as in MYEPSILON and remain satisfied as long
3246	* as the integrated current density is very small (e.g. compared to single entries in the current density array)
3247	* \param *P Problem at hand
3248	* \param index index of current component
3249	* \sa CalculateNativeIntDens() for integration of one current tensor component
3250	*/
3251	void TestCurrent(struct Problem *P, const int index)
3252	{
3253	struct RunStruct *R = &P->R;
3254	struct LatticeLevel *Lev0 = R->Lev0;
3255	struct Density *Dens0 = Lev0->Dens;
3256	fftw_real CurrentDensity[NDIMNDIM];
3257	int in;
3258	double result[NDIM*NDIM], res = 0.;
3259
3260	// set pointers onto current density array and get number of grid points in each direction
3261	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
3262	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
3263	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
3264	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
3265	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
3266	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
3267	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
3268	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
3269	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
3270	for(in=0;in<NDIM;in++) {
3271	result[in] = CalculateNativeIntDens(P,Lev0,CurrentDensity[in + NDIM*index],R->FactorDensityR);
3272	res += pow(result[in],2.);
3273	}
3274	res = sqrt(res);
3275	// if greater than 0, complain about it
3276	if ((res > MYEPSILON) && (P->Call.out[LeaderOut]))
3277	fprintf(stderr, "(%i) \\int_\\Omega d^3 r j_%i(r) = (%e,%e,%e), %e > %e!\n",P->Par.me, index, result[0], result[1], result[2], res, MYEPSILON);
3278	}
3279
3280	/** Testing whether re<->im switches (due to symmetry) confuses fft.
3281	* \param *P Problem at hand
3282	* \param l local wave function number
3283	*/
3284	void test_fft_symmetry(struct Problem *P, const int l)
3285	{
3286	struct Lattice *Lat = &P->Lat;
3287	struct RunStruct *R = &P->R;
3288	struct LatticeLevel *LevS = R->LevS;
3289	struct LatticeLevel *Lev0 = R->Lev0;
3290	struct Density *Dens0 = Lev0->Dens;
3291	struct fft_plan_3d *plan = Lat->plan;
3292	fftw_complex tempdestRC = (fftw_complex )Dens0->DensityCArray[Temp2Density];
3293	fftw_complex *work = Dens0->DensityCArray[TempDensity];
3294	fftw_complex workC = (fftw_complex )Dens0->DensityArray[TempDensity];
3295	fftw_complex posfac, destpos, destRCS, destRCD;
3296	fftw_complex *PsiC = Dens0->DensityCArray[ActualPsiDensity];
3297	fftw_real PsiCR = (fftw_real ) PsiC;
3298	fftw_complex *Psi0 = LevS->LPsi->LocalPsi[l];
3299	fftw_complex *dest = LevS->LPsi->TempPsi;
3300	fftw_real Psi0R = (fftw_real )Dens0->DensityArray[Temp2Density];
3301	int i,Index, pos, i0, iS,g; //, NoOfPsis = Psi->TypeStartIndex[UnOccupied] - Psi->TypeStartIndex[Occupied];
3302	int n[NDIM], n0;
3303	const int N0 = LevS->Plan0.plan->local_nx; // we don't want to build global density, but local
3304	int N[NDIM], NUp[NDIM];
3305	N[0] = LevS->Plan0.plan->N[0];
3306	N[1] = LevS->Plan0.plan->N[1];
3307	N[2] = LevS->Plan0.plan->N[2];
3308	NUp[0] = LevS->NUp[0];
3309	NUp[1] = LevS->NUp[1];
3310	NUp[2] = LevS->NUp[2];
3311	//const int k_normal = Lat->Psi.TypeStartIndex[Occupied] + (l - Lat->Psi.TypeStartIndex[R->CurrentMin]);
3312	//const double *Wcentre = Lat->Psi.AddData[k_normal].WannierCentre;
3313	//double x[NDIM], fac[NDIM];
3314	double result1=0., result2=0., result3=0., result4=0.;
3315	double Result1=0., Result2=0., Result3=0., Result4=0.;
3316	const double HGcRCFactor = 1./LevS->MaxN; // factor for inverse fft
3317
3318
3319	// fft to real space
3320	SetArrayToDouble0((double )tempdestRC, Dens0->TotalSize2);
3321	SetArrayToDouble0((double )PsiC, Dens0->TotalSize2);
3322	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is positive
3323	Index = LevS->GArray[i].Index;
3324	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
3325	destpos = &tempdestRC[LevS->MaxNUp*Index];
3326	for (pos=0; pos < LevS->MaxNUp; pos++) {
3327	destpos[pos].re = (Psi0[i].re)posfac[pos].re-(Psi0[i].im)posfac[pos].im;
3328	destpos[pos].im = (Psi0[i].re)posfac[pos].im+(Psi0[i].im)posfac[pos].re;
3329	//destpos[pos].re = (Psi0[i].im)posfac[pos].re-(-Psi0[i].re)posfac[pos].im;
3330	//destpos[pos].im = (Psi0[i].im)posfac[pos].im+(-Psi0[i].re)posfac[pos].re;
3331	}
3332	}
3333	for (i=0; i<LevS->MaxDoubleG; i++) {
3334	destRCS = &tempdestRC[LevS->DoubleG[2i]LevS->MaxNUp];
3335	destRCD = &tempdestRC[LevS->DoubleG[2i+1]LevS->MaxNUp];
3336	for (pos=0; pos < LevS->MaxNUp; pos++) {
3337	destRCD[pos].re = destRCS[pos].re;
3338	destRCD[pos].im = -destRCS[pos].im;
3339	}
3340	}
3341	fft_3d_complex_to_real(plan, LevS->LevelNo, FFTNFUp, tempdestRC, work);
3342	DensityRTransformPos(LevS,(fftw_real*)tempdestRC, Psi0R);
3343
3344	// apply position operator and do first result
3345	for (n0=0;n0<N0;n0++) // only local points on x axis
3346	for (n[1]=0;n[1]<N[1];n[1]++)
3347	for (n[2]=0;n[2]<N[2];n[2]++) {
3348	n[0]=n0 + LevS->Plan0.plan->start_nx; // global relative coordinate: due to partitoning of x-axis in PEPGamma>1 case
3349	i0 = n[2]NUp[2]+N[2]NUp[2](n[1]NUp[1]+N[1]NUp[1]n0*NUp[0]);
3350	iS = n[2]+N[2](n[1]+N[1]n0);
3351	//x[0] += 1; // shifting expectation value of x coordinate from 0 to 1
3352	PsiCR[iS] = Psi0R[i0]; // truedist(Lat, x[0], Wcentre[0],0) *
3353	result1 += PsiCR[iS] * Psi0R[i0];
3354	}
3355	result1 /= LevS->MaxN; // factor due to discrete integration
3356	MPI_Allreduce ( &result1, &Result1, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum "LocalSize to TotalSize"
3357	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) 1st result: %e\n",P->Par.me, Result1);
3358
3359	// fft to reciprocal space and do second result
3360	fft_3d_real_to_complex(plan, LevS->LevelNo, FFTNF1, PsiC, workC);
3361	SetArrayToDouble0((double )dest, 2R->InitLevS->MaxG);
3362	for (g=0; g < LevS->MaxG; g++) {
3363	Index = LevS->GArray[g].Index;
3364	dest[g].re = (Psi0[Index].re)*HGcRCFactor;
3365	dest[g].im = (Psi0[Index].im)*HGcRCFactor;
3366	}
3367	result2 = GradSP(P,LevS,Psi0,dest);
3368	MPI_Allreduce ( &result2, &Result2, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum "LocalSize to TotalSize"
3369	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) 2nd result: %e\n",P->Par.me, Result2);
3370
3371	// fft again to real space, this time change symmetry
3372	SetArrayToDouble0((double )tempdestRC, Dens0->TotalSize2);
3373	SetArrayToDouble0((double )PsiC, Dens0->TotalSize2);
3374	for (i=0;i<LevS->MaxG;i++) { // incoming is positive, outgoing is positive
3375	Index = LevS->GArray[i].Index;
3376	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
3377	destpos = &tempdestRC[LevS->MaxNUp*Index];
3378	for (pos=0; pos < LevS->MaxNUp; pos++) {
3379	destpos[pos].re = (Psi0[i].im)posfac[pos].re-(-Psi0[i].re)posfac[pos].im;
3380	destpos[pos].im = (Psi0[i].im)posfac[pos].im+(-Psi0[i].re)posfac[pos].re;
3381	}
3382	}
3383	for (i=0; i<LevS->MaxDoubleG; i++) {
3384	destRCS = &tempdestRC[LevS->DoubleG[2i]LevS->MaxNUp];
3385	destRCD = &tempdestRC[LevS->DoubleG[2i+1]LevS->MaxNUp];
3386	for (pos=0; pos < LevS->MaxNUp; pos++) {
3387	destRCD[pos].re = destRCS[pos].re;
3388	destRCD[pos].im = -destRCS[pos].im;
3389	}
3390	}
3391	fft_3d_complex_to_real(plan, LevS->LevelNo, FFTNFUp, tempdestRC, work);
3392	DensityRTransformPos(LevS,(fftw_real*)tempdestRC, Psi0R);
3393
3394	// bring down from Lev0 to LevS
3395	for (n0=0;n0<N0;n0++) // only local points on x axis
3396	for (n[1]=0;n[1]<N[1];n[1]++)
3397	for (n[2]=0;n[2]<N[2];n[2]++) {
3398	i0 = n[2]NUp[2]+N[2]NUp[2](n[1]NUp[1]+N[1]NUp[1]n0*NUp[0]);
3399	iS = n[2]+N[2](n[1]+N[1]n0);
3400	PsiCR[iS] = Psi0R[i0]; // truedist(Lat, x[0], Wcentre[0],0) *
3401	result3 += PsiCR[iS] * Psi0R[i0];
3402	}
3403	result3 /= LevS->MaxN; // factor due to discrete integration
3404	MPI_Allreduce ( &result3, &Result3, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum "LocalSize to TotalSize"
3405	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) 3rd result: %e\n",P->Par.me, Result3);
3406
3407	// fft back to reciprocal space, change symmetry back and do third result
3408	fft_3d_real_to_complex(plan, LevS->LevelNo, FFTNF1, PsiC, workC);
3409	SetArrayToDouble0((double )dest, 2R->InitLevS->MaxG);
3410	for (g=0; g < LevS->MaxG; g++) {
3411	Index = LevS->GArray[g].Index;
3412	dest[g].re = (-PsiC[Index].im)*HGcRCFactor;
3413	dest[g].im = ( PsiC[Index].re)*HGcRCFactor;
3414	}
3415	result4 = GradSP(P,LevS,Psi0,dest);
3416	MPI_Allreduce ( &result4, &Result4, 1, MPI_DOUBLE, MPI_SUM, P->Par.comm_ST_Psi); // sum "LocalSize to TotalSize"
3417	if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) 4th result: %e\n",P->Par.me, Result4);
3418	}
3419
3420
3421	/** Test function to check RxP application.
3422	* Checks applied solution to an analytic for a specific and simple wave function -
3423	* where just one coefficient is unequal to zero.
3424	* \param *P Problem at hand
3425	exp(I b G) - I exp(I b G) b G - exp(I a G) + I exp(I a G) a G
3426	-------------------------------------------------------------
3427	2
3428	G
3429	*/
3430	void test_rxp(struct Problem *P)
3431	{
3432	struct RunStruct *R = &P->R;
3433	struct Lattice *Lat = &P->Lat;
3434	//struct LatticeLevel *Lev0 = R->Lev0;
3435	struct LatticeLevel *LevS = R->LevS;
3436	struct OneGData *GA = LevS->GArray;
3437	//struct Density *Dens0 = Lev0->Dens;
3438	fftw_complex *Psi0 = LevS->LPsi->TempPsi;
3439	fftw_complex *Psi2 = P->Grad.GradientArray[GraSchGradient];
3440	fftw_complex *Psi3 = LevS->LPsi->TempPsi2;
3441	int g, g_bar, i, j, k, k_normal = 0;
3442	double tmp, a,b, G;
3443	//const double *Wcentre = Lat->Psi.AddData[k_normal].WannierCentre;
3444	const double discrete_factor = 1.;//Lat->Volume/LevS->MaxN;
3445	fftw_complex integral;
3446
3447	// reset coefficients
3448	debug (P,"Creating RxP test function.");
3449	SetArrayToDouble0((double )Psi0,2R->InitLevS->MaxG);
3450	SetArrayToDouble0((double )Psi2,2R->InitLevS->MaxG);
3451
3452	// pick one which becomes non-zero
3453	g = 3;
3454
3455	//for (g=0;g<LevS->MaxG;g++) {
3456	Psi0[g].re = 1.;
3457	Psi0[g].im = 0.;
3458	//}
3459	fprintf(stderr,"(%i) G[%i] = (%e,%e,%e) \n",P->Par.me, g, GA[g].G[0], GA[g].G[1], GA[g].G[2]);
3460	i = 0;
3461
3462	// calculate analytic result
3463	debug (P,"Calculating analytic solution.");
3464	for (g_bar=0;g_bar<LevS->MaxG;g_bar++) {
3465	for (g=0;g<LevS->MaxG;g++) {
3466	if (GA[g].G[i] == GA[g_bar].G[i]) {
3467	j = cross(i,0);
3468	k = cross(i,1);
3469	if (GA[g].G[k] == GA[g_bar].G[k]) {
3470	//b = truedist(Lat, sqrt(Lat->RealBasisSQ[j]), Wcentre[j], j);
3471	b = sqrt(Lat->RealBasisSQ[j]);
3472	//a = truedist(Lat, 0., Wcentre[j], j);
3473	a = 0.;
3474	G = 1; //GA[g].G[k];
3475	if (GA[g].G[j] == GA[g_bar].G[j]) {
3476	Psi2[g_bar].re += GPsi0[g].re (.5 * b * b - .5 * a * a) * discrete_factor;
3477	Psi2[g_bar].im += GPsi0[g].im (.5 * b * b - .5 * a * a) * discrete_factor;
3478	//if ((G != 0) && ((fabs(Psi0[g].re) > MYEPSILON) \|\| (fabs(Psi0[g].im) > MYEPSILON)))
3479	//fprintf(stderr,"(%i) Psi[%i].re += %e +i %e\n",P->Par.me, g_bar, GPsi0[g].re (.5 * b * b - .5 * a * a) * discrete_factor, GPsi0[g].im (.5 * b * b - .5 * a * a) * discrete_factor);
3480	} else {
3481	tmp = GA[g].G[j]-GA[g_bar].G[j];
3482	integral.re = (cos(tmpb)+sin(tmpb)btmp - cos(tmpa)-sin(tmpa)atmp) / (tmp * tmp);
3483	integral.im = (sin(tmpb)-cos(tmpb)btmp - sin(tmpa)+cos(tmpa)atmp) / (tmp * tmp);
3484	Psi2[g_bar].re += G(Psi0[g].reintegral.re - Psi0[g].imintegral.im) discrete_factor;
3485	Psi2[g_bar].im += G(Psi0[g].reintegral.im + Psi0[g].imintegral.re) discrete_factor;
3486	//if ((G != 0) && ((fabs(Psi0[g].re) > MYEPSILON) \|\| (fabs(Psi0[g].im) > MYEPSILON)))
3487	//fprintf(stderr,"(%i) Psi[%i].re += %e\tPsi[%i].im += %e \n",P->Par.me, g_bar, G(Psi0[g].reintegral.re - Psi0[g].imintegral.im) discrete_factor, g_bar, G(Psi0[g].reintegral.im + Psi0[g].imintegral.re) discrete_factor);
3488	}
3489	}
3490	j = cross(i,2);
3491	k = cross(i,3);
3492	if (GA[g].G[k] == GA[g_bar].G[k]) {
3493	//b = truedist(Lat, sqrt(Lat->RealBasisSQ[j]), Wcentre[j], j);
3494	b = sqrt(Lat->RealBasisSQ[j]);
3495	//a = truedist(Lat, 0., Wcentre[j], j);
3496	a = 0.;
3497	G = 1; //GA[g].G[k];
3498	if (GA[g].G[j] == GA[g_bar].G[j]) {
3499	Psi2[g_bar].re += GPsi0[g].re (.5 * b * b - .5 * a * a) * discrete_factor;
3500	Psi2[g_bar].im += GPsi0[g].im (.5 * b * b - .5 * a * a) * discrete_factor;
3501	//if ((G != 0) && ((fabs(Psi0[g].re) > MYEPSILON) \|\| (fabs(Psi0[g].im) > MYEPSILON)))
3502	//fprintf(stderr,"(%i) Psi[%i].re += %e +i %e\n",P->Par.me, g_bar, GPsi0[g].re (.5 * b * b - .5 * a * a) * discrete_factor, GPsi0[g].im (.5 * b * b - .5 * a * a) * discrete_factor);
3503	} else {
3504	tmp = GA[g].G[j]-GA[g_bar].G[j];
3505	integral.re = (cos(tmpb)+sin(tmpb)btmp - cos(tmpa)-sin(tmpa)atmp) / (tmp * tmp);
3506	integral.im = (sin(tmpb)-cos(tmpb)btmp - sin(tmpa)+cos(tmpa)atmp) / (tmp * tmp);
3507	Psi2[g_bar].re += G(Psi0[g].reintegral.re - Psi0[g].imintegral.im) discrete_factor;
3508	Psi2[g_bar].im += G(Psi0[g].reintegral.im + Psi0[g].imintegral.re) discrete_factor;
3509	//if ((G != 0) && ((fabs(Psi0[g].re) > MYEPSILON) \|\| (fabs(Psi0[g].im) > MYEPSILON)))
3510	//fprintf(stderr,"(%i) Psi[%i].re += %e\tPsi[%i].im += %e \n",P->Par.me, g_bar, G(Psi0[g].reintegral.re - Psi0[g].imintegral.im) discrete_factor, g_bar, G(Psi0[g].reintegral.im + Psi0[g].imintegral.re) discrete_factor);
3511	}
3512	}
3513	}
3514	}
3515	}
3516
3517	// apply rxp
3518	debug (P,"Applying RxP to test function.");
3519	CalculatePerturbationOperator_RxP(P,Psi0,Psi3,k_normal,i);
3520
3521	// compare both coefficient arrays
3522	debug(P,"Beginning comparison of analytic and Rxp applied solution.");
3523	for (g=0;g<LevS->MaxG;g++) {
3524	if ((fabs(Psi3[g].re-Psi2[g].re) >= MYEPSILON) \|\| (fabs(Psi3[g].im-Psi2[g].im) >= MYEPSILON))
3525	fprintf(stderr,"(%i) Psi3[%i] = %e +i %e != Psi2[%i] = %e +i %e\n",P->Par.me, g, Psi3[g].re, Psi3[g].im, g, Psi2[g].re, Psi2[g].im);
3526	//else
3527	//fprintf(stderr,"(%i) Psi1[%i] == Psi2[%i] = %e +i %e\n",P->Par.me, g, g, Psi1[g].re, Psi1[g].im);
3528	}
3529	fprintf(stderr,"(%i) <0\|1> = <0\|r\|0> == %e +i %e\n",P->Par.me, GradSP(P,LevS,Psi0,Psi3), GradImSP(P,LevS,Psi0,Psi3));
3530	fprintf(stderr,"(%i) <1\|1> = \|r\|ï¿œ == %e +i %e\n",P->Par.me, GradSP(P,LevS,Psi3,Psi3), GradImSP(P,LevS,Psi3,Psi3));
3531	fprintf(stderr,"(%i) <0\|0> = %e +i %e\n",P->Par.me, GradSP(P,LevS,Psi0,Psi0), GradImSP(P,LevS,Psi0,Psi0));
3532	fprintf(stderr,"(%i) <0\|2> = %e +i %e\n",P->Par.me, GradSP(P,LevS,Psi0,Psi2), GradImSP(P,LevS,Psi0,Psi2));
3533	}
3534
3535
3536	/** Output of a (X,Y,DX,DY) 2d-vector plot.
3537	* For a printable representation of the induced current two-dimensional vector plots are useful, as three-dimensional
3538	* isospheres are sometimes mis-leading or do not represent the desired flow direction. The routine simply extracts a
3539	* two-dimensional cut orthogonal to one of the lattice axis at a certain node.
3540	* \param *P Problem at hand
3541	* \param B_index direction of B field
3542	* \param n_orth grid node in B_index direction of the plane (the order in which the remaining two coordinate axis
3543	* appear is the same as in a cross product, which is used to determine orthogonality)
3544	*/
3545	void PlotVectorPlane(struct Problem *P, int B_index, int n_orth)
3546	{
3547	struct RunStruct *R = &P->R;
3548	struct LatticeLevel *Lev0 = R->Lev0;
3549	struct Density *Dens0 = Lev0->Dens;
3550	char filename[255];
3551	char *suchpointer;
3552	FILE *PlotFile = NULL;
3553	const int myPE = P->Par.me_comm_ST;
3554	time_t seconds;
3555	fftw_real CurrentDensity[NDIMNDIM];
3556	CurrentDensity[0] = (fftw_real *) Dens0->DensityArray[CurrentDensity0];
3557	CurrentDensity[1] = (fftw_real *) Dens0->DensityArray[CurrentDensity1];
3558	CurrentDensity[2] = (fftw_real *) Dens0->DensityArray[CurrentDensity2];
3559	CurrentDensity[3] = (fftw_real *) Dens0->DensityArray[CurrentDensity3];
3560	CurrentDensity[4] = (fftw_real *) Dens0->DensityArray[CurrentDensity4];
3561	CurrentDensity[5] = (fftw_real *) Dens0->DensityArray[CurrentDensity5];
3562	CurrentDensity[6] = (fftw_real *) Dens0->DensityArray[CurrentDensity6];
3563	CurrentDensity[7] = (fftw_real *) Dens0->DensityArray[CurrentDensity7];
3564	CurrentDensity[8] = (fftw_real *) Dens0->DensityArray[CurrentDensity8];
3565	time(&seconds); // get current time
3566
3567	if (!myPE) { // only process 0 writes to file
3568	// open file
3569	sprintf(&filename[0], ".current.L%i.csv", Lev0->LevelNo);
3570	OpenFile(P, &PlotFile, filename, "w", P->Call.out[ReadOut]);
3571	strcpy(filename, ctime(&seconds));
3572	suchpointer = strchr(filename, '\n');
3573	if (suchpointer != NULL)
3574	*suchpointer = '\0';
3575	if (PlotFile != NULL) {
3576	fprintf(PlotFile,"# current vector plot of plane perpendicular to direction e_%i at node %i, seed %i, config %s, run on %s, #cpus %i", B_index, n_orth, R->Seed, P->Files.default_path, filename, P->Par.Max_me_comm_ST_Psi);
3577	fprintf(PlotFile,"\n");
3578	} else { Error(SomeError, "PlotVectorPlane: Opening Plot File"); }
3579	}
3580
3581	// plot density
3582	if (!P->Par.me_comm_ST_PsiT) // only first wave function group as current density of all psis was gathered
3583	PlotRealDensity(P, Lev0, PlotFile, B_index, n_orth, CurrentDensity[B_indexNDIM+cross(B_index,0)], CurrentDensity[B_indexNDIM+cross(B_index,1)]);
3584
3585	if (PlotFile != NULL) {
3586	// close file
3587	fclose(PlotFile);
3588	}
3589	}
3590
3591
3592	/** Reads psi coefficients of \a type from file and transforms to new level.
3593	* \param *P Problem at hand
3594	* \param type PsiTypeTag of which minimisation group to load from file
3595	* \sa ReadSrcPsiDensity() - reading the coefficients, ChangePsiAndDensToLevUp() - transformation to upper level
3596	*/
3597	void ReadSrcPerturbedPsis(struct Problem *P, enum PsiTypeTag type)
3598	{
3599	struct RunStruct *R = &P->R;
3600	struct Lattice *Lat = &P->Lat;
3601	struct LatticeLevel *Lev0 = &P->Lat.Lev[R->Lev0No+1]; // one level higher than current (ChangeLevUp already occurred)
3602	struct LatticeLevel *LevS = &P->Lat.Lev[R->LevSNo+1];
3603	struct Density *Dens = Lev0->Dens;
3604	struct Psis *Psi = &Lat->Psi;
3605	struct fft_plan_3d *plan = Lat->plan;
3606	fftw_complex work = (fftw_complex )Dens->DensityCArray[TempDensity];
3607	fftw_complex tempdestRC = (fftw_complex )Dens->DensityArray[TempDensity];
3608	fftw_complex posfac, destpos, destRCS, destRCD;
3609	fftw_complex source, source0;
3610	int Index,i,pos;
3611	double factorC = 1./Lev0->MaxN;
3612	int p,g;
3613
3614	// ================= read coefficients from file to LocalPsi ============
3615	ReadSrcPsiDensity(P, type, 0, R->LevSNo+1);
3616
3617	// ================= transform to upper level ===========================
3618	// for all local Psis do the usual transformation (completing coefficients for all grid vectors, fft, permutation)
3619	LockDensityArray(Dens, TempDensity, real);
3620	LockDensityArray(Dens, TempDensity, imag);
3621	for (p=Psi->LocalNo-1; p >= 0; p--)
3622	if (Psi->LocalPsiStatus[p].PsiType == type) { // only for the desired type
3623	source = LevS->LPsi->LocalPsi[p];
3624	source0 = Lev0->LPsi->LocalPsi[p];
3625	//fprintf(stderr,"(%i) ReadSrcPerturbedPsis: LevSNo %i\t Lev0No %i\tp %i\t source %p\t source0 %p\n", P->Par.me, LevS->LevelNo, Lev0->LevelNo, p, source, source0);
3626	SetArrayToDouble0((double )tempdestRC, Dens->TotalSize2);
3627	for (i=0;i<LevS->MaxG;i++) {
3628	Index = LevS->GArray[i].Index;
3629	posfac = &LevS->PosFactorUp[LevS->MaxNUp*i];
3630	destpos = &tempdestRC[LevS->MaxNUp*Index];
3631	//if (isnan(source[i].re)) { fprintf(stderr,"(%i) WARNING in ReadSrcPerturbedPsis(): source_%i[%i] = NaN!\n", P->Par.me, p, i); Error(SomeError, "NaN-Fehler!"); }
3632	for (pos=0; pos < LevS->MaxNUp; pos++) {
3633	destpos[pos].re = source[i].reposfac[pos].re-source[i].imposfac[pos].im;
3634	destpos[pos].im = source[i].reposfac[pos].im+source[i].imposfac[pos].re;
3635	}
3636	}
3637	for (i=0; i<LevS->MaxDoubleG; i++) {
3638	destRCS = &tempdestRC[LevS->DoubleG[2i]LevS->MaxNUp];
3639	destRCD = &tempdestRC[LevS->DoubleG[2i+1]LevS->MaxNUp];
3640	for (pos=0; pos < LevS->MaxNUp; pos++) {
3641	destRCD[pos].re = destRCS[pos].re;
3642	destRCD[pos].im = -destRCS[pos].im;
3643	}
3644	}
3645	fft_3d_complex_to_real(plan, LevS->LevelNo, FFTNFUp, tempdestRC, work);
3646	DensityRTransformPos(LevS,(fftw_real)tempdestRC,(fftw_real )Dens->DensityCArray[ActualPsiDensity]);
3647	// now we have density in the upper level, fft back to complex and store it as wave function coefficients
3648	fft_3d_real_to_complex(plan, Lev0->LevelNo, FFTNF1, Dens->DensityCArray[ActualPsiDensity], work);
3649	for (g=0; g < Lev0->MaxG; g++) {
3650	Index = Lev0->GArray[g].Index;
3651	source0[g].re = Dens->DensityCArray[ActualPsiDensity][Index].re*factorC;
3652	source0[g].im = Dens->DensityCArray[ActualPsiDensity][Index].im*factorC;
3653	//if (isnan(source0[g].re)) { fprintf(stderr,"(%i) WARNING in ReadSrcPerturbedPsis(): source0_%i[%i] = NaN!\n", P->Par.me, p, g); Error(SomeError, "NaN-Fehler!"); }
3654	}
3655	if (Lev0->GArray[0].GSq == 0.0)
3656	source0[g].im = 0.0;
3657	}
3658	UnLockDensityArray(Dens, TempDensity, real);
3659	UnLockDensityArray(Dens, TempDensity, imag);
3660	// finished.
3661	}
3662
3663	/** evaluates perturbed energy functional
3664	* \param norm norm of current Psi in functional
3665	* \param *params void-pointer to parameter array
3666	* \return evaluated functional at f(x) with \a norm
3667	*/
3668	double perturbed_function (double norm, void *params) {
3669	struct Problem P = (struct Problem )params;
3670	int i, n = P->R.LevS->MaxG;
3671	double old_norm = GramSchGetNorm2(P,P->R.LevS,P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo]);
3672	fftw_complex *currentPsi = P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo];
3673	fprintf(stderr,"(%i) perturbed_function: setting norm to %lg ...", P->Par.me, norm);
3674	// set desired norm for current Psi
3675	for (i=0; i< n; i++) {
3676	currentPsi[i].re *= norm/old_norm; // real part
3677	currentPsi[i].im *= norm/old_norm; // imaginary part
3678	}
3679	P->R.PsiStep = 0; // make it not advance to next Psi
3680
3681	//debug(P,"UpdateActualPsiNo");
3682	UpdateActualPsiNo(P, P->R.CurrentMin); // orthogonalize
3683	//debug(P,"UpdateEnergyArray");
3684	UpdateEnergyArray(P); // shift energy values in their array by one
3685	//debug(P,"UpdatePerturbedEnergyCalculation");
3686	UpdatePerturbedEnergyCalculation(P); // re-calc energies (which is hopefully lower)
3687	EnergyAllReduce(P); // gather from all processes and sum up to total energy
3688	/*
3689	for (i=0; i< n; i++) {
3690	currentPsi[i].re /= norm/old_norm; // real part
3691	currentPsi[i].im /= norm/old_norm; // imaginary part
3692	}*/
3693
3694	fprintf(stderr,"%lg\n", P->Lat.E->TotalEnergy[0]);
3695	return P->Lat.E->TotalEnergy[0]; // and return evaluated functional
3696	}
3697
3698	/** evaluates perturbed energy functional.
3699	* \param *x current position in functional
3700	* \param *params void-pointer to parameter array
3701	* \return evaluated functional at f(x)
3702	*/
3703	double perturbed_f (const gsl_vector x, void params) {
3704	struct Problem P = (struct Problem )params;
3705	int i, n = P->R.LevS->MaxG*2;
3706	fftw_complex *currentPsi = P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo];
3707	//int diff = 0;
3708	//debug(P,"f");
3709	// put x into current Psi
3710	for (i=0; i< n; i+=2) {
3711	//if ((currentPsi[i/2].re != gsl_vector_get (x, i)) \|\| (currentPsi[i/2].im != gsl_vector_get (x, i+1))) diff++;
3712	currentPsi[i/2].re = gsl_vector_get (x, i); // real part
3713	currentPsi[i/2].im = gsl_vector_get (x, i+1); // imaginary part
3714	}
3715	//if (diff) fprintf(stderr,"(%i) %i differences between old and new currentPsi.\n", P->Par.me, diff);
3716	P->R.PsiStep = 0; // make it not advance to next Psi
3717
3718	//debug(P,"UpdateActualPsiNo");
3719	UpdateActualPsiNo(P, P->R.CurrentMin); // orthogonalize
3720	//debug(P,"UpdateEnergyArray");
3721	UpdateEnergyArray(P); // shift energy values in their array by one
3722	//debug(P,"UpdatePerturbedEnergyCalculation");
3723	UpdatePerturbedEnergyCalculation(P); // re-calc energies (which is hopefully lower)
3724	EnergyAllReduce(P); // gather from all processes and sum up to total energy
3725
3726	return P->Lat.E->TotalEnergy[0]; // and return evaluated functional
3727	}
3728
3729	/** evaluates perturbed energy gradient.
3730	* \param *x current position in functional
3731	* \param *params void-pointer to parameter array
3732	* \param *g array for gradient vector on return
3733	*/
3734	void perturbed_df (const gsl_vector x, void params, gsl_vector *g) {
3735	struct Problem P = (struct Problem )params;
3736	int i, n = P->R.LevS->MaxG*2;
3737	fftw_complex *currentPsi = P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo];
3738	fftw_complex *gradient = P->Grad.GradientArray[ActualGradient];
3739	//int diff = 0;
3740	//debug(P,"df");
3741	// put x into current Psi
3742	for (i=0; i< n; i+=2) {
3743	//if ((currentPsi[i/2].re != gsl_vector_get (x, i)) \|\| (currentPsi[i/2].im != gsl_vector_get (x, i+1))) diff++;
3744	currentPsi[i/2].re = gsl_vector_get (x, i); // real part
3745	currentPsi[i/2].im = gsl_vector_get (x, i+1); // imaginary part
3746	}
3747	//if (diff) fprintf(stderr,"(%i) %i differences between old and new currentPsi.\n", P->Par.me, diff);
3748	P->R.PsiStep = 0; // make it not advance to next Psi
3749
3750	//debug(P,"UpdateActualPsiNo");
3751	UpdateActualPsiNo(P, P->R.CurrentMin); // orthogonalize
3752	//debug(P,"UpdateEnergyArray");
3753	UpdateEnergyArray(P); // shift energy values in their array by one
3754	//debug(P,"UpdatePerturbedEnergyCalculation");
3755	UpdatePerturbedEnergyCalculation(P); // re-calc energies (which is hopefully lower)
3756	EnergyAllReduce(P); // gather from all processes and sum up to total energy
3757
3758	// checkout gradient
3759	//diff = 0;
3760	for (i=0; i< n; i+=2) {
3761	//if ((-gradient[i/2].re != gsl_vector_get (g, i)) \|\| (-gradient[i/2].im != gsl_vector_get (g, i+1))) diff++;
3762	gsl_vector_set (g, i, -gradient[i/2].re); // real part
3763	gsl_vector_set (g, i+1, -gradient[i/2].im); // imaginary part
3764	}
3765	//if (diff) fprintf(stderr,"(%i) %i differences between old and new gradient.\n", P->Par.me, diff);
3766	}
3767
3768	/** evaluates perturbed energy functional and gradient.
3769	* \param *x current position in functional
3770	* \param *params void-pointer to parameter array
3771	* \param *f pointer to energy function value on return
3772	* \param *g array for gradient vector on return
3773	*/
3774	void perturbed_fdf (const gsl_vector x, void params, double f, gsl_vector g) {
3775	struct Problem P = (struct Problem )params;
3776	int i, n = P->R.LevS->MaxG*2;
3777	fftw_complex *currentPsi = P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo];
3778	fftw_complex *gradient = P->Grad.GradientArray[ActualGradient];
3779	//int diff = 0;
3780	//debug(P,"fdf");
3781	// put x into current Psi
3782	for (i=0; i< n; i+=2) {
3783	//if ((currentPsi[i/2].re != gsl_vector_get (x, i)) \|\| (currentPsi[i/2].im != gsl_vector_get (x, i+1))) diff++;
3784	currentPsi[i/2].re = gsl_vector_get (x, i); // real part
3785	currentPsi[i/2].im = gsl_vector_get (x, i+1); // imaginary part
3786	}
3787	//if (diff) fprintf(stderr,"(%i) %i differences between old and new currentPsi.\n", P->Par.me, diff);
3788	P->R.PsiStep = 0; // make it not advance to next Psi
3789
3790	//debug(P,"UpdateActualPsiNo");
3791	UpdateActualPsiNo(P, P->R.CurrentMin); // orthogonalize
3792	//debug(P,"UpdateEnergyArray");
3793	UpdateEnergyArray(P); // shift energy values in their array by one
3794	//debug(P,"UpdatePerturbedEnergyCalculation");
3795	UpdatePerturbedEnergyCalculation(P); // re-calc energies (which is hopefully lower)
3796	EnergyAllReduce(P); // gather from all processes and sum up to total energy
3797
3798	// checkout gradient
3799	//diff = 0;
3800	for (i=0; i< n; i+=2) {
3801	//if ((-gradient[i/2].re != gsl_vector_get (g, i)) \|\| (-gradient[i/2].im != gsl_vector_get (g, i+1))) diff++;
3802	gsl_vector_set (g, i, -gradient[i/2].re); // real part
3803	gsl_vector_set (g, i+1, -gradient[i/2].im); // imaginary part
3804	}
3805	//if (diff) fprintf(stderr,"(%i) %i differences between old and new gradient.\n", P->Par.me, diff);
3806
3807	*f = P->Lat.E->TotalEnergy[0]; // and return evaluated functional
3808	}
3809
3810	/* MinimisePerturbed with all the brent minimisation approach
3811	void MinimisePerturbed (struct Problem P, int Stop, int *SuperStop) {
3812	struct RunStruct *R = &P->R;
3813	struct Lattice *Lat = &P->Lat;
3814	struct Psis *Psi = &Lat->Psi;
3815	int type;
3816	//int i;
3817
3818	// stuff for GSL minimization
3819	//size_t iter;
3820	//int status, Status
3821	int n = R->LevS->MaxG*2;
3822	const gsl_multimin_fdfminimizer_type *T_multi;
3823	const gsl_min_fminimizer_type *T;
3824	gsl_multimin_fdfminimizer *s_multi;
3825	gsl_min_fminimizer *s;
3826	gsl_vector x;//, ss;
3827	gsl_multimin_function_fdf my_func;
3828	gsl_function F;
3829	//fftw_complex *currentPsi;
3830	//double a,b,m, f_m, f_a, f_b;
3831	//double old_norm;
3832
3833	my_func.f = &perturbed_f;
3834	my_func.df = &perturbed_df;
3835	my_func.fdf = &perturbed_fdf;
3836	my_func.n = n;
3837	my_func.params = P;
3838	F.function = &perturbed_function;
3839	F.params = P;
3840
3841	x = gsl_vector_alloc (n);
3842	//ss = gsl_vector_alloc (Psi->NoOfPsis);
3843	T_multi = gsl_multimin_fdfminimizer_vector_bfgs;
3844	s_multi = gsl_multimin_fdfminimizer_alloc (T_multi, n);
3845	T = gsl_min_fminimizer_brent;
3846	s = gsl_min_fminimizer_alloc (T);
3847
3848	for (type=Perturbed_P0;type<=Perturbed_RxP2;type++) { // go through each perturbation group separately //
3849	*Stop=0; // reset stop flag
3850	fprintf(stderr,"(%i)Beginning perturbed minimisation of type %s ...\n", P->Par.me, R->MinimisationName[type]);
3851	//OutputOrbitalPositions(P, Occupied);
3852	R->PsiStep = R->MaxPsiStep; // reset in-Psi-minimisation-counter, so that we really advance to the next wave function
3853	UpdateActualPsiNo(P, type); // step on to next perturbed one
3854	fprintf(stderr, "(%i) Re-initializing perturbed psi array for type %s ", P->Par.me, R->MinimisationName[type]);
3855	if (P->Call.ReadSrcFiles && ReadSrcPsiDensity(P,type,1, R->LevSNo)) {
3856	SpeedMeasure(P, InitSimTime, StartTimeDo);
3857	fprintf(stderr,"from source file of recent calculation\n");
3858	ReadSrcPsiDensity(P,type, 0, R->LevSNo);
3859	ResetGramSchTagType(P, Psi, type, IsOrthogonal); // loaded values are orthonormal
3860	SpeedMeasure(P, DensityTime, StartTimeDo);
3861	//InitDensityCalculation(P);
3862	SpeedMeasure(P, DensityTime, StopTimeDo);
3863	R->OldActualLocalPsiNo = R->ActualLocalPsiNo; // needed otherwise called routines in function below crash
3864	UpdateGramSchOldActualPsiNo(P,Psi);
3865	InitPerturbedEnergyCalculation(P, 1); // go through all orbitals calculate each H^{(0)}-eigenvalue, recalc HGDensity, cause InitDensityCalc zero'd it
3866	UpdatePerturbedEnergyCalculation(P); // H1cGradient and Gradient must be current ones
3867	EnergyAllReduce(P); // gather energies for minimum search
3868	SpeedMeasure(P, InitSimTime, StopTimeDo);
3869	}
3870	if (P->Call.ReadSrcFiles != 1) {
3871	SpeedMeasure(P, InitSimTime, StartTimeDo);
3872	ResetGramSchTagType(P, Psi, type, NotOrthogonal); // perturbed now shall be orthonormalized
3873	if (P->Call.ReadSrcFiles != 2) {
3874	if (R->LevSNo == Lat->MaxLevel-1) { // is it the starting level? (see InitRunLevel())
3875	fprintf(stderr, "randomly.\n");
3876	InitPsisValue(P, Psi->TypeStartIndex[type], Psi->TypeStartIndex[type+1]); // initialize perturbed array for this run
3877	} else {
3878	fprintf(stderr, "from source file of last level.\n");
3879	ReadSrcPerturbedPsis(P, type);
3880	}
3881	}
3882	SpeedMeasure(P, InitGramSchTime, StartTimeDo);
3883	GramSch(P, R->LevS, Psi, Orthogonalize);
3884	SpeedMeasure(P, InitGramSchTime, StopTimeDo);
3885	SpeedMeasure(P, InitDensityTime, StartTimeDo);
3886	//InitDensityCalculation(P);
3887	SpeedMeasure(P, InitDensityTime, StopTimeDo);
3888	InitPerturbedEnergyCalculation(P, 1); // go through all orbitals calculate each H^{(0)}-eigenvalue, recalc HGDensity, cause InitDensityCalc zero'd it
3889	R->OldActualLocalPsiNo = R->ActualLocalPsiNo; // needed otherwise called routines in function below crash
3890	UpdateGramSchOldActualPsiNo(P,Psi);
3891	UpdatePerturbedEnergyCalculation(P); // H1cGradient and Gradient must be current ones
3892	EnergyAllReduce(P); // gather energies for minimum search
3893	SpeedMeasure(P, InitSimTime, StopTimeDo);
3894	R->LevS->Step++;
3895	EnergyOutput(P,0);
3896	while (*Stop != 1) {
3897	// copy current Psi into starting vector
3898	currentPsi = R->LevS->LPsi->LocalPsi[R->ActualLocalPsiNo];
3899	for (i=0; i< n; i+=2) {
3900	gsl_vector_set (x, i, currentPsi[i/2].re); // real part
3901	gsl_vector_set (x, i+1, currentPsi[i/2].im); // imaginary part
3902	}
3903	gsl_multimin_fdfminimizer_set (s_multi, &my_func, x, 0.01, 1e-2);
3904	iter = 0;
3905	status = 0;
3906	do { // look for minimum along current local psi
3907	iter++;
3908	status = gsl_multimin_fdfminimizer_iterate (s_multi);
3909	MPI_Allreduce(&status, &Status, 1, MPI_INT, MPI_MAX, P->Par.comm_ST_Psi);
3910	if (Status)
3911	break;
3912	status = gsl_multimin_test_gradient (s_multi->gradient, 1e-2);
3913	MPI_Allreduce(&status, &Status, 1, MPI_INT, MPI_MAX, P->Par.comm_ST_Psi);
3914	//if (Status == GSL_SUCCESS)
3915	//printf ("Minimum found at:\n");
3916	if (P->Par.me == 0) fprintf (stderr,"(%i,%i,%i)S(%i,%i,%i):\t %5d %10.5f\n",P->Par.my_color_comm_ST,P->Par.me_comm_ST, P->Par.me_comm_ST_PsiT, R->MinStep, R->ActualLocalPsiNo, R->PsiStep, (int)iter, s_multi->f);
3917	//TestGramSch(P,R->LevS,Psi, type); // functions are orthonormal?
3918	} while (Status == GSL_CONTINUE && iter < 3);
3919	// now minimize norm of currentPsi (one-dim)
3920	if (0) {
3921	iter = 0;
3922	status = 0;
3923	m = 1.;
3924	a = MYEPSILON;
3925	b = 100.;
3926	f_a = perturbed_function (a, P);
3927	f_b = perturbed_function (b, P);
3928	f_m = perturbed_function (m, P);
3929	//if ((f_m < f_a) && (f_m < f_b)) {
3930	gsl_min_fminimizer_set (s, &F, m, a, b);
3931	do { // look for minimum along current local psi
3932	iter++;
3933	status = gsl_min_fminimizer_iterate (s);
3934	m = gsl_min_fminimizer_x_minimum (s);
3935	a = gsl_min_fminimizer_x_lower (s);
3936	b = gsl_min_fminimizer_x_upper (s);
3937	status = gsl_min_test_interval (a, b, 0.001, 0.0);
3938	if (status == GSL_SUCCESS)
3939	printf ("Minimum found at:\n");
3940	printf ("%5d [%.7f, %.7f] %.7f %.7f\n",
3941	(int) iter, a, b,
3942	m, b - a);
3943	} while (status == GSL_CONTINUE && iter < 100);
3944	old_norm = GramSchGetNorm2(P,P->R.LevS,P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo]);
3945	for (i=0; i< n; i++) {
3946	currentPsi[i].re *= m/old_norm; // real part
3947	currentPsi[i].im *= m/old_norm; // imaginary part
3948	}
3949	} else debug(P,"Norm not minimizable!");
3950	//P->R.PsiStep = P->R.MaxPsiStep; // make it advance to next Psi
3951	FindPerturbedMinimum(P);
3952	//debug(P,"UpdateActualPsiNo");
3953	UpdateActualPsiNo(P, type); // step on to next perturbed Psi
3954	//debug(P,"UpdateEnergyArray");
3955	UpdateEnergyArray(P); // shift energy values in their array by one
3956	//debug(P,"UpdatePerturbedEnergyCalculation");
3957	UpdatePerturbedEnergyCalculation(P); // re-calc energies (which is hopefully lower)
3958	EnergyAllReduce(P); // gather from all processes and sum up to total energy
3959	//ControlNativeDensity(P); // check total density (summed up PertMixed must be zero!)
3960	//printf ("(%i,%i,%i)S(%i,%i,%i):\t %5d %10.5f\n",P->Par.my_color_comm_ST,P->Par.me_comm_ST, P->Par.me_comm_ST_PsiT, R->MinStep, R->ActualLocalPsiNo, R->PsiStep, (int)iter, s_multi->f);
3961	if (*SuperStop != 1)
3962	*SuperStop = CheckCPULIM(P);
3963	Stop = CalculateMinimumStop(P, SuperStop);
3964	P->Speed.Steps++; // step on
3965	R->LevS->Step++;
3966	}
3967	// now release normalization condition and minimize wrt to norm
3968	*Stop = 0;
3969	while (*Stop != 1) {
3970	currentPsi = R->LevS->LPsi->LocalPsi[R->ActualLocalPsiNo];
3971	iter = 0;
3972	status = 0;
3973	m = 1.;
3974	a = 0.001;
3975	b = 10.;
3976	f_a = perturbed_function (a, P);
3977	f_b = perturbed_function (b, P);
3978	f_m = perturbed_function (m, P);
3979	if ((f_m < f_a) && (f_m < f_b)) {
3980	gsl_min_fminimizer_set (s, &F, m, a, b);
3981	do { // look for minimum along current local psi
3982	iter++;
3983	status = gsl_min_fminimizer_iterate (s);
3984	m = gsl_min_fminimizer_x_minimum (s);
3985	a = gsl_min_fminimizer_x_lower (s);
3986	b = gsl_min_fminimizer_x_upper (s);
3987	status = gsl_min_test_interval (a, b, 0.001, 0.0);
3988	if (status == GSL_SUCCESS)
3989	printf ("Minimum found at:\n");
3990	printf ("%5d [%.7f, %.7f] %.7f %.7f\n",
3991	(int) iter, a, b,
3992	m, b - a);
3993	} while (status == GSL_CONTINUE && iter < 100);
3994	old_norm = GramSchGetNorm2(P,P->R.LevS,P->R.LevS->LPsi->LocalPsi[P->R.ActualLocalPsiNo]);
3995	for (i=0; i< n; i++) {
3996	currentPsi[i].re *= m/old_norm; // real part
3997	currentPsi[i].im *= m/old_norm; // imaginary part
3998	}
3999	}
4000	P->R.PsiStep = P->R.MaxPsiStep; // make it advance to next Psi
4001	//debug(P,"UpdateActualPsiNo");
4002	UpdateActualPsiNo(P, type); // step on to next perturbed Psi
4003	if (*SuperStop != 1)
4004	*SuperStop = CheckCPULIM(P);
4005	Stop = CalculateMinimumStop(P, SuperStop);
4006	P->Speed.Steps++; // step on
4007	R->LevS->Step++;
4008	}
4009	if(P->Call.out[NormalOut]) fprintf(stderr,"(%i) Write %s srcpsi to disk\n", P->Par.me, R->MinimisationName[type]);
4010	OutputSrcPsiDensity(P, type);
4011	// if (!TestReadnWriteSrcDensity(P,type))
4012	// Error(SomeError,"TestReadnWriteSrcDensity failed!");
4013	}
4014
4015	TestGramSch(P,R->LevS,Psi, type); // functions are orthonormal?
4016	// calculate current density summands
4017	//if (P->Call.out[StepLeaderOut]) fprintf(stderr,"(%i) Filling current density grid ...\n",P->Par.me);
4018	SpeedMeasure(P, CurrDensTime, StartTimeDo);
4019	if (*SuperStop != 1) {
4020	if ((R->DoFullCurrent == 1) \|\| ((R->DoFullCurrent == 2) && (CheckOrbitalOverlap(P) == 1))) { //test to check whether orbitals have mutual overlap and thus \\DeltaJ_{xc} must not be dropped
4021	R->DoFullCurrent = 1; // set to 1 if it was 2 but Check...() yielded necessity
4022	//debug(P,"Filling with Delta j ...");
4023	//FillDeltaCurrentDensity(P);
4024	}// else
4025	//debug(P,"There is no overlap between orbitals.");
4026	//debug(P,"Filling with j ...");
4027	FillCurrentDensity(P);
4028	}
4029	SpeedMeasure(P, CurrDensTime, StopTimeDo);
4030
4031	SetGramSchExtraPsi(P,Psi,NotUsedToOrtho); // remove extra Psis from orthogonality check
4032	ResetGramSchTagType(P, Psi, type, NotUsedToOrtho); // remove this group from the check for the next minimisation group as well!
4033	}
4034	UpdateActualPsiNo(P, Occupied); // step on back to an occupied one
4035
4036	gsl_multimin_fdfminimizer_free (s_multi);
4037	gsl_min_fminimizer_free (s);
4038	gsl_vector_free (x);
4039	//gsl_vector_free (ss);
4040	}
4041	*/

Note: See TracBrowser for help on using the repository browser.

Download in other formats: