// kernel1.cl
/*

OCLADock, an OpenCL implementation of AutoDock 4.2 running a Lamarckian Genetic Algorithm
Copyright (C) 2017 TU Darmstadt, Embedded Systems and Applications Group, Germany. All rights reserved.

AutoDock is a Trade Mark of the Scripps Research Institute.

This program is free software; you can redistribute it and/or
modify it under the terms of the GNU General Public License
as published by the Free Software Foundation; either version 2
of the License, or (at your option) any later version.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.

*/


// Author (per commit annotation): Leonardo Solis
/*
 * gpu_calc_initpop
 *
 * Every work-group evaluates exactly one entity, selected by get_group_id(0)
 * (presumably an individual of the initial population, going by the kernel
 * name):
 *   1. the entity's genotype is copied from dockpars_conformations_current
 *      into local memory,
 *   2. the run ID is derived as get_group_id(0) / dockpars_pop_size,
 *   3. gpu_calc_energy() is invoked by all work-items of the group,
 *   4. work-item 0 stores the resulting energy and sets the entity's
 *      evaluation counter to 1.
 *
 * Parameters used directly by this kernel:
 *   dockpars_conformations_current  input genotypes; entity g starts at offset
 *                                   GENOTYPE_LENGTH_IN_GLOBMEM * g
 *   dockpars_energies_current       output, one energy per work-group
 *   dockpars_evals_of_new_entities  output, set to 1 per work-group
 *   dockpars_pop_size               divisor used to derive the run ID
 *
 * All remaining parameters are forwarded unchanged to gpu_calc_energy().
 */
__kernel void __attribute__ ((reqd_work_group_size(NUM_OF_THREADS_PER_BLOCK,1,1)))
gpu_calc_initpop(
	char   dockpars_num_of_atoms,
	char   dockpars_num_of_atypes,
	int    dockpars_num_of_intraE_contributors,
	char   dockpars_gridsize_x,
	char   dockpars_gridsize_y,
	char   dockpars_gridsize_z,
	float  dockpars_grid_spacing,
	__global const float* restrict dockpars_fgrids, // This is too large to be allocated in __constant
	int    dockpars_rotbondlist_length,
	float  dockpars_coeff_elec,
	float  dockpars_coeff_desolv,
	__global const float* restrict dockpars_conformations_current,
	__global       float* restrict dockpars_energies_current,
	__global       int*   restrict dockpars_evals_of_new_entities,
	int    dockpars_pop_size,
	float  dockpars_qasp,
	__constant float* atom_charges_const,
	__constant char*  atom_types_const,
	__constant char*  intraE_contributors_const,
	__constant float* VWpars_AC_const,
	__constant float* VWpars_BD_const,
	__constant float* dspars_S_const,
	__constant float* dspars_V_const,
	__constant int*   rotlist_const,
	__constant float* ref_coords_x_const,
	__constant float* ref_coords_y_const,
	__constant float* ref_coords_z_const,
	__constant float* rotbonds_moving_vectors_const,
	__constant float* rotbonds_unit_vectors_const,
	__constant float* ref_orientation_quats_const
){
	// Some OpenCL compilers don't allow declaring
	// local variables within non-kernel functions.
	// These local variables must be declared in a kernel,
	// and then passed to non-kernel functions.
	__local float genotype[ACTUAL_GENOTYPE_LENGTH];
	__local float energy;
	__local int   run_id;

	__local float calc_coords_x[MAX_NUM_OF_ATOMS];
	__local float calc_coords_y[MAX_NUM_OF_ATOMS];
	__local float calc_coords_z[MAX_NUM_OF_ATOMS];
	__local float partial_energies[NUM_OF_THREADS_PER_BLOCK];

	// Number of genes to transfer. The local buffer holds only
	// ACTUAL_GENOTYPE_LENGTH floats, whereas GENOTYPE_LENGTH_IN_GLOBMEM is the
	// per-entity stride in global memory; copying the full stride could write
	// past the end of genotype[], so the count is clamped to the smaller one.
	const size_t genes_to_copy =
		((GENOTYPE_LENGTH_IN_GLOBMEM) < (ACTUAL_GENOTYPE_LENGTH))
			? (GENOTYPE_LENGTH_IN_GLOBMEM)
			: (ACTUAL_GENOTYPE_LENGTH);

	// Copying genotype from global memory
	event_t ev = async_work_group_copy(genotype,
	                                   dockpars_conformations_current + GENOTYPE_LENGTH_IN_GLOBMEM*get_group_id(0),
	                                   genes_to_copy, 0);

	// The asynchronous copy must have completed before genotype is read
	wait_group_events(1, &ev);

	// Determining run-ID
	if (get_local_id(0) == 0) {
		run_id = get_group_id(0) / dockpars_pop_size;
	}

	// run_id lives in local memory and is written by work-item 0 only;
	// make the write visible to the whole work-group before it is
	// handed to gpu_calc_energy().
	barrier(CLK_LOCAL_MEM_FENCE);

	// =============================================================
	// WARNING: only energy of work-item=0 will be valid
	gpu_calc_energy(dockpars_rotbondlist_length,
			dockpars_num_of_atoms,
			dockpars_gridsize_x,
			dockpars_gridsize_y,
			dockpars_gridsize_z,
			dockpars_fgrids,
			dockpars_num_of_atypes,
			dockpars_num_of_intraE_contributors,
			dockpars_grid_spacing,
			dockpars_coeff_elec,
			dockpars_qasp,
			dockpars_coeff_desolv,
			genotype,
			&energy,
			&run_id,
			// Some OpenCL compilers don't allow declaring
			// local variables within non-kernel functions.
			// These local variables must be declared in a kernel,
			// and then passed to non-kernel functions.
			calc_coords_x,
			calc_coords_y,
			calc_coords_z,
			partial_energies,

			atom_charges_const,
			atom_types_const,
			intraE_contributors_const,
			VWpars_AC_const,
			VWpars_BD_const,
			dspars_S_const,
			dspars_V_const,
			rotlist_const,
			ref_coords_x_const,
			ref_coords_y_const,
			ref_coords_z_const,
			rotbonds_moving_vectors_const,
			rotbonds_unit_vectors_const,
			ref_orientation_quats_const
			);
	// =============================================================

	// Only work-item 0 holds a valid energy (see warning above), so it alone
	// publishes the result and marks this entity as evaluated once.
	if (get_local_id(0) == 0) {
		dockpars_energies_current[get_group_id(0)] = energy;
		dockpars_evals_of_new_entities[get_group_id(0)] = 1;
	}
}