b107fea253c6f1fd70bf93156f6cca4b8d506399
[alexxy/gromacs.git] / src / gmxlib / nonbonded / nb_kernel_x86_64_sse2 / nb_kernel_x86_64_sse2.c
1 /* -*- mode: c; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4; c-file-style: "stroustrup"; -*- 
2  *
3  * 
4  * This file is part of Gromacs        Copyright (c) 1991-2004
5  * David van der Spoel, Erik Lindahl, University of Groningen.
6  *
7  * This program is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU General Public License
9  * as published by the Free Software Foundation; either version 2
10  * of the License, or (at your option) any later version.
11  *
12  * To help us fund GROMACS development, we humbly ask that you cite
13  * the research papers on the package. Check out http://www.gromacs.org
14  * 
15  * And Hey:
16  * Gnomes, ROck Monsters And Chili Sauce
17  */
18 #ifdef HAVE_CONFIG_H
19 #include <config.h>
20 #endif
21
22 /* Must come directly after config.h */
23 #ifdef GMX_THREAD_SHM_FDECOMP
24 #include <thread_mpi.h>
25 #endif
26
27 #include <types/simple.h>
28 #include <types/nrnb.h>
29
30 #include "nb_kernel_x86_64_sse2.h"
31
32 /* Include x86_64 SSE kernel headers in local directory */
33 #include "nb_kernel010_x86_64_sse2.h"
34 #include "nb_kernel030_x86_64_sse2.h"
35 #include "nb_kernel100_x86_64_sse2.h"
36 #include "nb_kernel101_x86_64_sse2.h"
37 #include "nb_kernel102_x86_64_sse2.h"
38 #include "nb_kernel103_x86_64_sse2.h"
39 #include "nb_kernel104_x86_64_sse2.h"
40 #include "nb_kernel110_x86_64_sse2.h"
41 #include "nb_kernel111_x86_64_sse2.h"
42 #include "nb_kernel112_x86_64_sse2.h"
43 #include "nb_kernel113_x86_64_sse2.h"
44 #include "nb_kernel114_x86_64_sse2.h"
45 #include "nb_kernel130_x86_64_sse2.h"
46 #include "nb_kernel131_x86_64_sse2.h"
47 #include "nb_kernel132_x86_64_sse2.h"
48 #include "nb_kernel133_x86_64_sse2.h"
49 #include "nb_kernel134_x86_64_sse2.h"
50 #include "nb_kernel200_x86_64_sse2.h"
51 #include "nb_kernel201_x86_64_sse2.h"
52 #include "nb_kernel202_x86_64_sse2.h"
53 #include "nb_kernel203_x86_64_sse2.h"
54 #include "nb_kernel204_x86_64_sse2.h"
55 #include "nb_kernel210_x86_64_sse2.h"
56 #include "nb_kernel211_x86_64_sse2.h"
57 #include "nb_kernel212_x86_64_sse2.h"
58 #include "nb_kernel213_x86_64_sse2.h"
59 #include "nb_kernel214_x86_64_sse2.h"
60 #include "nb_kernel230_x86_64_sse2.h"
61 #include "nb_kernel231_x86_64_sse2.h"
62 #include "nb_kernel232_x86_64_sse2.h"
63 #include "nb_kernel233_x86_64_sse2.h"
64 #include "nb_kernel234_x86_64_sse2.h"
65 #include "nb_kernel300_x86_64_sse2.h"
66 #include "nb_kernel301_x86_64_sse2.h"
67 #include "nb_kernel302_x86_64_sse2.h"
68 #include "nb_kernel303_x86_64_sse2.h"
69 #include "nb_kernel304_x86_64_sse2.h"
70 #include "nb_kernel310_x86_64_sse2.h"
71 #include "nb_kernel311_x86_64_sse2.h"
72 #include "nb_kernel312_x86_64_sse2.h"
73 #include "nb_kernel313_x86_64_sse2.h"
74 #include "nb_kernel314_x86_64_sse2.h"
75 #include "nb_kernel330_x86_64_sse2.h"
76 #include "nb_kernel331_x86_64_sse2.h"
77 #include "nb_kernel332_x86_64_sse2.h"
78 #include "nb_kernel333_x86_64_sse2.h"
79 #include "nb_kernel334_x86_64_sse2.h"
80 #include "nb_kernel400_x86_64_sse2.h"
81 #include "nb_kernel410_x86_64_sse2.h"
82 #include "nb_kernel430_x86_64_sse2.h"
83
84
85
86 #include <stdlib.h>
87 #include <stdio.h>
88 /* Necessary headers for POSIX-style long jumps. */
89 #include <signal.h>
90 #include <setjmp.h>
91
92
93 #include "../nb_kerneltype.h"
94 #include "nb_kernel_x86_64_sse2.h"
95 #include "nb_kernel_x86_64_sse2_test_asm.h"
96
97
98 static nb_kernel_t *
99 kernellist_x86_64_sse2[eNR_NBKERNEL_NR] = 
100 {
101     nb_kernel010_x86_64_sse2,
102     NULL,
103     nb_kernel030_x86_64_sse2,
104     nb_kernel100_x86_64_sse2,
105     nb_kernel101_x86_64_sse2,
106     nb_kernel102_x86_64_sse2,
107     nb_kernel103_x86_64_sse2,
108     nb_kernel104_x86_64_sse2,
109     nb_kernel110_x86_64_sse2,
110     nb_kernel111_x86_64_sse2,
111     nb_kernel112_x86_64_sse2,
112     nb_kernel113_x86_64_sse2,
113     nb_kernel114_x86_64_sse2,
114     NULL,
115     NULL,
116     NULL,
117     NULL,
118     NULL,
119     nb_kernel130_x86_64_sse2,
120     nb_kernel131_x86_64_sse2,
121     nb_kernel132_x86_64_sse2,
122     nb_kernel133_x86_64_sse2,
123     nb_kernel134_x86_64_sse2,
124     nb_kernel200_x86_64_sse2,
125     nb_kernel201_x86_64_sse2,
126     nb_kernel202_x86_64_sse2,
127     nb_kernel203_x86_64_sse2,
128     nb_kernel204_x86_64_sse2,
129     nb_kernel210_x86_64_sse2,
130     nb_kernel211_x86_64_sse2,
131     nb_kernel212_x86_64_sse2,
132     nb_kernel213_x86_64_sse2,
133     nb_kernel214_x86_64_sse2,
134     NULL,
135     NULL,
136     NULL,
137     NULL,
138     NULL,
139     nb_kernel230_x86_64_sse2,
140     nb_kernel231_x86_64_sse2,
141     nb_kernel232_x86_64_sse2,
142     nb_kernel233_x86_64_sse2,
143     nb_kernel234_x86_64_sse2,
144     nb_kernel300_x86_64_sse2,
145     nb_kernel301_x86_64_sse2,
146     nb_kernel302_x86_64_sse2,
147     nb_kernel303_x86_64_sse2,
148     nb_kernel304_x86_64_sse2,
149     nb_kernel310_x86_64_sse2,
150     nb_kernel311_x86_64_sse2,
151     nb_kernel312_x86_64_sse2,
152     nb_kernel313_x86_64_sse2,
153     nb_kernel314_x86_64_sse2,
154     NULL,
155     NULL,
156     NULL,
157     NULL,
158     NULL,
159     nb_kernel330_x86_64_sse2,
160     nb_kernel331_x86_64_sse2,
161     nb_kernel332_x86_64_sse2,
162     nb_kernel333_x86_64_sse2,
163     nb_kernel334_x86_64_sse2,
164     nb_kernel400_x86_64_sse2,
165     nb_kernel410_x86_64_sse2,
166     nb_kernel430_x86_64_sse2
167 };
168
169 #ifdef GMX_THREAD_SHM_FDECOMP
170 static tMPI_Thread_mutex_t 
171 nb_kernel_x86_64_sse2_test_mutex = TMPI_THREAD_MUTEX_INITIALIZER;
172 #endif
173
174 /*! Posix long jump label */
175 static jmp_buf         
176 nb_kernel_x86_64_sse2_testprog;
177
178 /*! Result of x86_64 SSE2 test */
179 static bool
180 nb_kernel_x86_64_sse2_present;
181
182
183 static void 
184 nb_kernel_x86_64_sse2_sigill_handler(int n)
185 {
186   nb_kernel_x86_64_sse2_present=FALSE;
187   longjmp(nb_kernel_x86_64_sse2_testprog,n);
188 }
189
190
191
192
193 /* Return GMX_SUCCESS (0) if SSE2 support is present, or
194  * general error GMX_EFAILURE.
195  */
196 int 
197 nb_kernel_x86_64_sse2_test(FILE *                log)
198 {
199         /* 
200          * This should NOT be called from threads, 
201          * but just in case you still try to do it...
202          */
203 #ifdef GMX_THREAD_SHM_FDECOMP
204         tMPI_Thread_mutex_lock(&nb_kernel_x86_64_sse2_test_mutex);
205 #endif
206     
207     if(log)
208         fprintf(log,"Testing x86_64 SSE2 support...");
209
210         nb_kernel_x86_64_sse2_present = TRUE;
211         signal(SIGILL,nb_kernel_x86_64_sse2_sigill_handler);
212
213         /* return to this point after executing the signal handler
214          * if we catch a SIGILL
215          */
216         setjmp(nb_kernel_x86_64_sse2_testprog); 
217
218         if(nb_kernel_x86_64_sse2_present)
219                 nb_kernel_x86_64_sse2_test_asm();
220         
221         /* If SSE2 worked, then success is still 1.
222      * If we got SIGILL, it was set to 0 in sigill_handler().
223      */
224
225         if(log)
226                 fprintf(log," %spresent.\n", 
227                                 nb_kernel_x86_64_sse2_present ? "":"not ");
228         
229 #ifdef GMX_THREAD_SHM_FDECOMP
230         tMPI_Thread_mutex_unlock(&nb_kernel_x86_64_sse2_test_mutex);
231 #endif
232     
233         return ((nb_kernel_x86_64_sse2_present) ? 0 : -1);
234 }
235
236                                 
237
238 void
239 nb_kernel_setup_x86_64_sse2(FILE *log,nb_kernel_t **list)
240 {
241     int i;
242     nb_kernel_t *p;
243     
244     if(nb_kernel_x86_64_sse2_test(log) != 0)
245         return;
246     
247     for(i=0;i<eNR_NBKERNEL_NR;i++)
248     {
249         p = kernellist_x86_64_sse2[i];
250         if(p!=NULL)
251             list[i] = p; 
252     }
253 }