forked from etmc/tmLQCD
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathget_staples.c
124 lines (108 loc) · 3.15 KB
/
get_staples.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
/***********************************************************************
* Copyright (C) 2002,2003,2004,2005,2006,2007,2008 Carsten Urbach
*
* This file is part of tmLQCD.
*
* tmLQCD is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* tmLQCD is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with tmLQCD. If not, see <http://www.gnu.org/licenses/>.
***********************************************************************/
#ifdef HAVE_CONFIG_H
# include<config.h>
#endif
#include <stdlib.h>
#include <stdio.h>
#include <math.h>
#include <time.h>
#include "global.h"
#include "su3.h"
#include "su3adj.h"
#include "start.h"
#include "get_staples.h"
#if ((defined BGL_notchecked) && (defined XLC))
/*
 * get_staples -- variant compiled only when both BGL_notchecked and XLC are
 * defined (see the enclosing #if).
 *
 * For site index x and direction mu, loops over the four directions k,
 * skipping k == mu, and combines links of in_gauge_field reached through the
 * neighbour tables g_iup and g_idn. The result is returned by value.
 *
 *   x               site index into in_gauge_field, g_iup and g_idn
 *   mu              direction index; the k == mu iteration is skipped
 *   in_gauge_field  accessed as in_gauge_field[site][direction]
 *
 * Returns a copy of the function-static su3 v.
 *
 * NOTE(review): `st` is used below (L191/L193 of the original listing) but is
 * not declared in this function; unless an included header provides it, this
 * variant will not compile. The guard macro name "BGL_notchecked" suggests
 * the path is unverified -- confirm before enabling.
 * NOTE(review): the first half of the loop accumulates into the struct v via
 * _su3_times_su3_acc, whereas the second half uses _bgl_* macros that take no
 * destination argument, and _bgl_store_vxx(v) is applied at the end. v itself
 * is never zeroed here (only v00..v22 are). Presumably the _bgl_* macros work
 * on the local u / v / w / reg variables declared below -- TODO confirm
 * against the macro definitions.
 */
su3 get_staples(int x, int mu, su3 ** in_gauge_field) {
/* We have 32 registers */
/* Complex scalars that are not referenced by name in this function body;
 * presumably they are used implicitly by the _bgl_* macros -- TODO confirm. */
double _Complex u00, u01, u02, u10, u11, u12, u20;
double _Complex v00, v01, v02, v10, v11, v12, v20, v21, v22;
double _Complex w00, w01, w02, w10, w11, w12, w20;
double _Complex reg00, reg01, reg02, reg10, reg11, reg12, reg20, reg21, reg22;
int k, iy;
/* Static storage: the same object is reused by every call; callers receive a
 * copy through the by-value return. */
static su3 v;
/* Pointers to the three links used in each product. */
su3 *w1 ALIGN;
su3 *w2 ALIGN;
su3 *w3 ALIGN;
/* Clear the nine complex accumulator entries v00..v22. */
v00 = __cmplx(0.,0.);
v01 = __cmplx(0.,0.);
v02 = __cmplx(0.,0.);
v10 = __cmplx(0.,0.);
v11 = __cmplx(0.,0.);
v12 = __cmplx(0.,0.);
v20 = __cmplx(0.,0.);
v21 = __cmplx(0.,0.);
v22 = __cmplx(0.,0.);
/* Visit every direction k except mu. */
#pragma unroll(4)
for(k = 0; k < 4; k++) {
if(k!=mu){
/* Links taken at x, at g_iup[x][k] and at g_iup[x][mu]. */
w1=&in_gauge_field[x][k];
w2=&in_gauge_field[g_iup[x][k]][mu];
w3=&in_gauge_field[g_iup[x][mu]][k];
/* st = w2 * w3^d */
_su3_times_su3d(st,*w2,*w3);
/* v = v + w1 * st */
_su3_times_su3_acc(v,*w1,st);
/* Links taken at iy = g_idn[x][k] and at g_iup[iy][mu]. */
iy=g_idn[x][k];
w1=&in_gauge_field[iy][k];
w2=&in_gauge_field[iy][mu];
w3=&in_gauge_field[g_iup[iy][mu]][k];
/* st = w2 * w3 */
/* v = v + w1^d * st */
/* NOTE(review): the two comments above describe the intended operation; the
 * macros below name neither st nor v explicitly -- verify they implement it. */
_bgl_su3_times_su3(*w2, *w3);
_bgl_su3_times_su3_acc(*w1);
}
}
/* Presumably writes the accumulated v00..v22 values into the struct v --
 * TODO confirm in the macro definition. */
_bgl_store_vxx(v);
return(v);
}
#else
/*
 * get_staples -- generic variant (used when the BGL/XLC path is not enabled).
 *
 * Accumulates, for every direction k different from mu, two products of
 * three links of in_gauge_field around site x:
 *
 *   v += U[x][k]         * ( U[g_iup[x][k]][mu] * U[g_iup[x][mu]][k]^dagger )
 *   v += U[iy][k]^dagger * ( U[iy][mu]          * U[g_iup[iy][mu]][k] )
 *
 * with iy = g_idn[x][k] and U = in_gauge_field.
 *
 *   x               site index into in_gauge_field, g_iup and g_idn
 *   mu              direction index; the k == mu iteration is skipped
 *   in_gauge_field  accessed as in_gauge_field[site][direction]
 *
 * Returns the accumulated su3 matrix by value.
 *
 * The accumulator and the scratch matrix have static storage duration, so
 * the function is not reentrant.
 */
su3 get_staples(int x, int mu, su3 ** in_gauge_field) {
  int k, iy;
  static su3 v, st;
  su3 *w1, *w2, *w3;
#ifdef _KOJAK_INST
#pragma pomp inst begin(staples)
#endif
  _su3_zero(v);
  for (k = 0; k < 4; k++) {
    if (k == mu) {
      continue;
    }

    /* Product built from the links at x, g_iup[x][k] and g_iup[x][mu]. */
    w1 = &in_gauge_field[x][k];
    w2 = &in_gauge_field[g_iup[x][k]][mu];
    w3 = &in_gauge_field[g_iup[x][mu]][k];
    /* st = w2 * w3^d */
    _su3_times_su3d(st, *w2, *w3);
    /* v = v + w1 * st */
    _su3_times_su3_acc(v, *w1, st);

    /* Product built from the links at iy = g_idn[x][k] and g_iup[iy][mu]. */
    iy = g_idn[x][k];
    w1 = &in_gauge_field[iy][k];
    w2 = &in_gauge_field[iy][mu];
    w3 = &in_gauge_field[g_iup[iy][mu]][k];
    /* st = w2 * w3 */
    _su3_times_su3(st, *w2, *w3);
    /* v = v + w1^d * st */
    _su3d_times_su3_acc(v, *w1, st);
  }
  /* The region end marker has to precede the return statement: code placed
   * after the return is unreachable, so the instrumented region would never
   * be closed. */
#ifdef _KOJAK_INST
#pragma pomp inst end(staples)
#endif
  return v;
}
#endif