ViennaCL - The Vienna Computing Library  1.6.0
Free open-source GPU-accelerated linear algebra and solver library.
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
tesla_k20m.hpp
Go to the documentation of this file.
1 #ifndef VIENNACL_DEVICE_SPECIFIC_BUILTIN_DATABASE_DEVICES_GPU_NVIDIA_KEPLER_K20M_HPP_
2 #define VIENNACL_DEVICE_SPECIFIC_BUILTIN_DATABASE_DEVICES_GPU_NVIDIA_KEPLER_K20M_HPP_
3 
5 
7 
9 
11 
13 
16 
17 namespace viennacl{
18 namespace device_specific{
19 namespace builtin_database{
20 namespace devices{
21 namespace gpu{
22 namespace nvidia{
23 namespace kepler{
24 namespace tesla_k20m{
25 
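26 void add_8B(database_type< matrix_product_template::parameters_type > &db, char_to_type<'T'>, char_to_type<'T'>)
27 {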
28  db.add_8B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", matrix_product_template::parameters_type(1,2,8,32,8,2,4,FETCH_FROM_LOCAL,FETCH_FROM_GLOBAL_STRIDED,4,16));
29 }
30 
32 {
33  db.add_8B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", matrix_product_template::parameters_type(1,16,16,32,2,1,4,FETCH_FROM_LOCAL,FETCH_FROM_LOCAL,16,32));
34 }
35 
37 {
38  db.add_8B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", matrix_product_template::parameters_type(1,2,8,64,16,1,2,FETCH_FROM_LOCAL,FETCH_FROM_GLOBAL_STRIDED,32,4));
39 }
40 
42 {
43  db.add_8B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", matrix_product_template::parameters_type(1,128,32,1,1,1,16,FETCH_FROM_GLOBAL_CONTIGUOUS,FETCH_FROM_LOCAL,16,8));
44 }
45 
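46 void add_4B(database_type< matrix_product_template::parameters_type > &db, char_to_type<'T'>, char_to_type<'T'>)
47 {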
48  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", matrix_product_template::parameters_type(1,8,32,16,4,8,4,FETCH_FROM_LOCAL,FETCH_FROM_GLOBAL_STRIDED,8,16));
49 }
50 
52 {
53  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", matrix_product_template::parameters_type(1,32,16,32,8,2,4,FETCH_FROM_LOCAL,FETCH_FROM_LOCAL,16,64));
54 }
55 
57 {
59 }
60 
62 {
63  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", matrix_product_template::parameters_type(1,128,64,1,4,2,16,FETCH_FROM_GLOBAL_STRIDED,FETCH_FROM_LOCAL,16,8));
64 }
65 
67 {
68  db.add_8B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", row_wise_reduction_template::parameters_type(1,2,64,1024,FETCH_FROM_GLOBAL_STRIDED));
69 }
70 
72 {
74 }
75 
77 {
78  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", row_wise_reduction_template::parameters_type(1,1,128,2048,FETCH_FROM_GLOBAL_STRIDED));
79 }
80 
82 {
84 }
85 
87 {
88  db.add_8B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", reduction_template::parameters_type(1,256,4096,FETCH_FROM_GLOBAL_STRIDED));
89 }
90 
92 {
93  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", reduction_template::parameters_type(1,128,512,FETCH_FROM_GLOBAL_STRIDED));
94 }
95 
97 {
98  db.add_8B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", matrix_axpy_template::parameters_type(1,64,8,128,128,FETCH_FROM_GLOBAL_STRIDED));
99 }
100 
102 {
103  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", matrix_axpy_template::parameters_type(1,32,4,128,128,FETCH_FROM_GLOBAL_CONTIGUOUS));
104 }
105 
107 {
108  db.add_8B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", vector_axpy_template::parameters_type(1,256,16384,FETCH_FROM_GLOBAL_STRIDED));
109 }
110 
112 {
113  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::unknown, "Tesla K20m", vector_axpy_template::parameters_type(1,256,16384,FETCH_FROM_GLOBAL_STRIDED));
114 }
115 
116 }
117 }
118 }
119 }
120 }
121 }
122 }
123 }
124 #endif
database_type< ParamT > & add_8B(vendor_id_type p0, device_type p1, ocl::device_architecture_family p2, device_name_type p3, ParamT const &p5)
Definition: common.hpp:83
database_type< ParamT > & add_4B(vendor_id_type p0, device_type p1, ocl::device_architecture_family p2, device_name_type p3, ParamT const &p5)
Definition: common.hpp:76
void add_4B(database_type< matrix_product_template::parameters_type > &db, char_to_type<'T'>, char_to_type<'T'>)
Definition: tesla_k20m.hpp:46
Forward declaration.
void add_8B(database_type< matrix_product_template::parameters_type > &db, char_to_type<'T'>, char_to_type<'T'>)
Definition: tesla_k20m.hpp:26