00001
00002
00003
00004
00005
00006
00007 #ifndef __clover_term_base_w_h__
00008 #define __clover_term_base_w_h__
00009
00010 #include "linearop.h"
00011
00012
00013 namespace Chroma
00014 {
00015
00016
00017
00018
00019
00020
00021 template<typename T, typename U>
00022 class CloverTermBase : public DslashLinearOperator<T,
00023 multi1d<U>,
00024 multi1d<U> >
00025 {
00026 public:
00027
00028 virtual ~CloverTermBase() {}
00029
00030
00031 const Subset& subset() const {return all;}
00032
00033
00034 virtual void applySite(T& chi, const T& psi, enum PlusMinus isign, int site) const = 0;
00035
00036
00037
00038
00039
00040 virtual void choles(int cb) = 0;
00041
00042
00043
00044
00045
00046
00047
00048 virtual Double cholesDet(int cb) const = 0;
00049
00050
00051
00052
00053
00054
00055
00056
00057
00058 void deriv(multi1d<U>& ds_u,
00059 const T& chi, const T& psi,
00060 enum PlusMinus isign) const;
00061
00062
00063
00064
00065
00066
00067
00068
00069
00070
00071 void deriv(multi1d<U>& ds_u,
00072 const T& chi, const T& psi,
00073 enum PlusMinus isign, int cb) const;
00074
00075
00076 void derivTrLn(multi1d<U>& ds_u,
00077 enum PlusMinus isign, int cb) const;
00078
00079
00080 void deriv_loops(const int u, const int mu, const int cb,
00081 U& ds_u_mu,
00082 U& ds_u_nu,
00083 const U& Lambda) const;
00084
00085
00086 unsigned long nFlops() const;
00087
00088
00089 virtual void triacntr(U& B, int mat, int cb) const = 0;
00090
00091 protected:
00092
00093
00094 virtual const multi1d<U>& getU() const = 0;
00095
00096
00097 virtual Real getCloverCoeff(int mu, int nu) const = 0;
00098
00099 };
00100
00101
00102 template<typename T, typename U>
00103 unsigned long
00104 CloverTermBase<T,U>::nFlops() const {return 552;}
00105
00106
00107
00108
00109
00110
00111
00112
00113
00114
00115 template<typename T, typename U>
00116 void CloverTermBase<T,U>::deriv(multi1d<U>& ds_u,
00117 const T& chi, const T& psi,
00118 enum PlusMinus isign) const
00119 {
00120 START_CODE();
00121
00122
00123
00124 deriv(ds_u, chi, psi, isign,0);
00125
00126
00127 multi1d<U> ds_tmp;
00128 deriv(ds_tmp, chi, psi, isign,1);
00129
00130 ds_u += ds_tmp;
00131
00132 END_CODE();
00133 }
00134
00135
00136
00137 template<typename T, typename U>
00138 void CloverTermBase<T,U>::deriv_loops(const int mu, const int nu, const int cb,
00139 U& ds_u_mu,
00140 U& ds_u_nu,
00141 const U& Lambda) const
00142 {
00143 START_CODE();
00144
00145 const multi1d<U>& u = getU();
00146
00147
00148
00149
00150
00151
00152
00153
00154
00155
00156
00157
00158
00159
00160
00161
00162
00163
00164
00165
00166
00167
00168 U staple_for;
00169 U staple_back;
00170 U staple_left;
00171 U staple_right;
00172
00173 U u_nu_for_mu = shift(u[nu],FORWARD, mu);
00174 U u_mu_for_nu = shift(u[mu],FORWARD, nu);
00175 U Lambda_xplus_mu = shift(Lambda, FORWARD, mu);
00176 U Lambda_xplus_nu = shift(Lambda, FORWARD, nu);
00177 U Lambda_xplus_muplusnu = shift(Lambda_xplus_mu, FORWARD, nu);
00178
00179 U u_tmp3;
00180
00181 U ds_tmp_mu;
00182 U ds_tmp_nu;
00183 {
00184 U up_left_corner;
00185 U up_right_corner;
00186 U low_right_corner;
00187 U low_left_corner;
00188
00189
00190
00191
00192
00193
00194 up_left_corner = adj(u_mu_for_nu)*adj(u[nu]);
00195
00196
00197
00198
00199
00200
00201
00202
00203 up_right_corner = u_nu_for_mu*adj(u_mu_for_nu);
00204
00205
00206
00207
00208
00209
00210 low_right_corner = adj(u_nu_for_mu)*adj(u[mu]);
00211
00212
00213
00214
00215
00216
00217
00218 low_left_corner = adj(u[mu])*u[nu];
00219
00220
00221
00222
00223
00224
00225
00226
00227
00228
00229
00230
00231
00232
00233
00234
00235 u_tmp3[rb[cb]] = u_nu_for_mu*Lambda_xplus_muplusnu;
00236 ds_u_mu[rb[cb]] = u_tmp3*up_left_corner;
00237
00238
00239
00240
00241
00242
00243
00244
00245
00246
00247 u_tmp3[rb[1-cb]] = adj(u_mu_for_nu)*Lambda_xplus_nu;
00248
00249
00250 ds_tmp_nu[rb[1-cb]] = u_tmp3*adj(low_left_corner);
00251
00252
00253
00254
00255
00256
00257
00258
00259
00260
00261
00262 u_tmp3[rb[1-cb]] = Lambda_xplus_nu*adj(u[nu]);
00263 ds_u_mu[rb[1-cb]] = up_right_corner * u_tmp3;
00264
00265
00266
00267
00268
00269
00270
00271
00272
00273
00274 u_tmp3[rb[cb]] = up_left_corner*Lambda;
00275
00276
00277 ds_tmp_nu[rb[cb]] = u_tmp3*u[mu];
00278
00279
00280
00281
00282
00283
00284
00285
00286
00287
00288
00289
00290
00291
00292
00293
00294
00295
00296
00297
00298
00299
00300
00301 u_tmp3[rb[1-cb]] = adj(u_nu_for_mu)*Lambda_xplus_mu;
00302
00303
00304 ds_tmp_mu[rb[1-cb]] = u_tmp3*low_left_corner;
00305
00306
00307
00308
00309
00310
00311
00312
00313
00314 u_tmp3[rb[1-cb]] = adj(up_right_corner)*Lambda_xplus_mu;
00315 ds_u_nu[rb[1-cb]] = u_tmp3*adj(u[mu]);
00316
00317
00318
00319
00320
00321
00322
00323
00324
00325
00326
00327 u_tmp3[rb[cb]] = low_right_corner*Lambda;
00328
00329
00330 ds_tmp_mu[rb[cb]] = u_tmp3*u[nu];
00331
00332
00333
00334
00335
00336
00337
00338
00339
00340
00341
00342 u_tmp3[rb[cb]] = u_mu_for_nu*Lambda_xplus_muplusnu;
00343 ds_u_nu[rb[cb]] = u_tmp3*low_right_corner;
00344
00345
00346
00347
00348
00349
00350
00351
00352
00353
00354
00355
00356
00357
00358
00359
00360
00361 staple_for = u_nu_for_mu*up_left_corner;
00362
00363
00364
00365
00366
00367
00368
00369 staple_right = up_left_corner*u[mu];
00370
00371
00372
00373
00374
00375
00376
00377
00378 staple_left = u_mu_for_nu*low_right_corner;
00379
00380
00381
00382
00383
00384
00385
00386
00387
00388 staple_back = adj(u_nu_for_mu)*low_left_corner;
00389
00390 }
00391
00392
00393
00394
00395
00396
00397
00398
00399
00400 ds_u_mu[rb[cb]] += staple_for*Lambda;
00401
00402
00403
00404
00405
00406
00407
00408
00409
00410
00411
00412
00413 ds_tmp_nu[rb[1-cb]] += staple_right*Lambda_xplus_mu;
00414
00415
00416
00417
00418
00419
00420
00421
00422
00423
00424 ds_u_mu[rb[1-cb]] += Lambda_xplus_mu*staple_for;
00425
00426
00427
00428
00429
00430
00431
00432
00433
00434
00435 ds_tmp_nu[rb[cb]] += Lambda_xplus_muplusnu * staple_right;
00436
00437
00438
00439
00440
00441
00442
00443
00444
00445
00446
00447
00448 ds_tmp_mu[rb[1-cb]] += staple_back*Lambda_xplus_nu;
00449
00450
00451
00452
00453
00454
00455
00456
00457
00458 ds_u_nu[rb[cb]] += staple_left*Lambda;
00459
00460
00461
00462
00463
00464
00465
00466
00467
00468
00469 ds_tmp_mu[rb[cb]] += Lambda_xplus_muplusnu * staple_back;
00470
00471
00472
00473
00474
00475
00476
00477
00478
00479 ds_u_nu[rb[1-cb]] += Lambda_xplus_nu * staple_left;
00480
00481
00482
00483
00484 ds_u_mu -= shift(ds_tmp_mu, BACKWARD, nu);
00485 ds_u_nu -= shift(ds_tmp_nu, BACKWARD, mu);
00486
00487 END_CODE();
00488 }
00489
00490
00491
00492
00493
00494
00495
00496
00497
00498
00499
00500 template<typename T, typename U>
00501 void CloverTermBase<T,U>::deriv(multi1d<U>& ds_u,
00502 const T& chi, const T& psi,
00503 enum PlusMinus isign, int cb) const
00504 {
00505 START_CODE();
00506
00507
00508
00509 if( ds_u.size() != Nd ) {
00510 ds_u.resize(Nd);
00511 }
00512
00513 ds_u = zero;
00514
00515
00516 const multi1d<U>& u = getU();
00517
00518
00519
00520 for(int mu=0; mu < Nd; mu++) {
00521 for(int nu = mu+1; nu < Nd; nu++) {
00522
00523
00524
00525 U ds_tmp_mu;
00526
00527
00528
00529 U ds_tmp_nu;
00530
00531
00532 Real factor = (Real(-1)/Real(8))*getCloverCoeff(mu,nu);
00533
00534
00535
00536
00537 int mu_nu_index = (1 << mu) + (1 << nu);
00538 T ferm_tmp = Gamma(mu_nu_index)*psi;
00539 U s_xy_dag = traceSpin( outerProduct(ferm_tmp,chi));
00540 s_xy_dag *= Real(factor);
00541
00542
00543 deriv_loops(mu, nu, cb, ds_tmp_mu, ds_tmp_nu, s_xy_dag);
00544
00545
00546 ds_u[mu] += ds_tmp_mu;
00547 ds_u[nu] -= ds_tmp_nu;
00548
00549
00550 }
00551 }
00552
00553
00554
00555 (*this).getFermBC().zero(ds_u);
00556 END_CODE();
00557 }
00558
00559
00560
00561
00562
00563
00564
00565
00566
00567
00568
00569 template<typename T, typename U>
00570 void CloverTermBase<T,U>::derivTrLn(multi1d<U>& ds_u,
00571 enum PlusMinus isign, int cb) const
00572 {
00573 START_CODE();
00574
00575
00576 if( ds_u.size() != Nd ) {
00577 ds_u.resize(Nd);
00578 }
00579
00580 ds_u = zero;
00581
00582 for(int mu=0; mu < Nd; mu++) {
00583 for(int nu = mu+1; nu < Nd; nu++) {
00584
00585
00586 int mu_nu_index = (1 << mu) + (1 << nu);
00587
00588
00589 Real factor = Real(-1)*getCloverCoeff(mu,nu)/Real(8);
00590
00591 U sigma_XY_dag=zero;
00592
00593
00594 triacntr(sigma_XY_dag, mu_nu_index, cb);
00595 sigma_XY_dag[rb[cb]] *= factor;
00596
00597
00598 U ds_tmp_mu;
00599 U ds_tmp_nu;
00600
00601
00602 deriv_loops(mu, nu, cb, ds_tmp_mu, ds_tmp_nu, sigma_XY_dag);
00603
00604
00605 ds_u[mu] += ds_tmp_mu;
00606
00607
00608 ds_u[nu] -= ds_tmp_nu;
00609
00610 }
00611
00612 }
00613
00614
00615
00616 (*this).getFermBC().zero(ds_u);
00617
00618 END_CODE();
00619 }
00620
00621
00622
00623 }
00624
00625
00626 #endif