ViennaCL - The Vienna Computing Library
1.6.1
Free open-source GPU-accelerated linear algebra and solver library.
geforce_gt_540m.hpp
Go to the documentation of this file.
1
#ifndef VIENNACL_DEVICE_SPECIFIC_BUILTIN_DATABASE_DEVICES_GPU_NVIDIA_FERMI_GT540M_HPP_
2
#define VIENNACL_DEVICE_SPECIFIC_BUILTIN_DATABASE_DEVICES_GPU_NVIDIA_FERMI_GT540M_HPP_
3
4
#include "
viennacl/device_specific/templates/matrix_axpy_template.hpp
"
5
6
#include "
viennacl/device_specific/templates/matrix_product_template.hpp
"
7
8
#include "
viennacl/device_specific/templates/row_wise_reduction_template.hpp
"
9
10
#include "
viennacl/device_specific/templates/vector_axpy_template.hpp
"
11
12
#include "
viennacl/device_specific/forwards.h
"
13
#include "
viennacl/device_specific/builtin_database/common.hpp
"
14
15
namespace
viennacl
{
16
namespace
device_specific{
17
namespace
builtin_database{
18
namespace
devices{
19
namespace
gpu{
20
namespace
nvidia{
21
namespace
fermi
{
22
namespace
geforce_gt_540m{
23
24
/** @brief Registers the vector_axpy_template parameter set for the "GeForce GT 540M" through db.add_4B().
*
* The entry is keyed by nvidia_id, CL_DEVICE_TYPE_GPU and ocl::fermi.
* NOTE(review): "4B" presumably refers to 4-byte scalar types (e.g. float) - confirm against common.hpp.
*
* @param db   Database that receives the entry
*/
inline void add_4B(database_type<vector_axpy_template::parameters_type> & db)
{
  typedef vector_axpy_template::parameters_type profile_type;

  // Build the parameter set first, then hand it to the database by const reference.
  profile_type const tuned(1, 512, 512, FETCH_FROM_GLOBAL_STRIDED);
  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::fermi, "GeForce GT 540M", tuned);
}
28
29
/** @brief Registers the matrix_product_template parameter set for the "GeForce GT 540M" through db.add_4B().
*
* This overload is selected by the tag pair char_to_type<'T'>, char_to_type<'N'>; the tag values themselves are unused.
* NOTE(review): 'T'/'N' presumably mark transposed / non-transposed operands - confirm with the callers.
*
* @param db   Database that receives the entry
*/
inline void add_4B(database_type<matrix_product_template::parameters_type> & db, char_to_type<'T'>, char_to_type<'N'>)
{
  typedef matrix_product_template::parameters_type profile_type;

  // Build the parameter set first, then hand it to the database by const reference.
  profile_type const tuned(1, 16, 16, 8, 4, 1, 8, FETCH_FROM_LOCAL, FETCH_FROM_LOCAL, 16, 8);
  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::fermi, "GeForce GT 540M", tuned);
}
33
34
/** @brief Registers the matrix_product_template parameter set for the "GeForce GT 540M" through db.add_4B().
*
* This overload is selected by the tag pair char_to_type<'N'>, char_to_type<'T'>; the tag values themselves are unused.
* NOTE(review): 'N'/'T' presumably mark non-transposed / transposed operands - confirm with the callers.
*
* @param db   Database that receives the entry
*/
inline void add_4B(database_type<matrix_product_template::parameters_type> & db, char_to_type<'N'>, char_to_type<'T'>)
{
  typedef matrix_product_template::parameters_type profile_type;

  // Build the parameter set first, then hand it to the database by const reference.
  profile_type const tuned(1, 16, 16, 16, 8, 1, 4, FETCH_FROM_LOCAL, FETCH_FROM_LOCAL, 32, 8);
  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::fermi, "GeForce GT 540M", tuned);
}
38
39
/** @brief Registers the matrix_product_template parameter set for the "GeForce GT 540M" through db.add_4B().
*
* This overload is selected by the tag pair char_to_type<'N'>, char_to_type<'N'>; the tag values themselves are unused.
* NOTE(review): 'N' presumably marks a non-transposed operand - confirm with the callers.
*
* @param db   Database that receives the entry
*/
inline void add_4B(database_type<matrix_product_template::parameters_type> & db, char_to_type<'N'>, char_to_type<'N'>)
{
  typedef matrix_product_template::parameters_type profile_type;

  // Build the parameter set first, then hand it to the database by const reference.
  profile_type const tuned(1, 8, 16, 16, 8, 1, 4, FETCH_FROM_LOCAL, FETCH_FROM_LOCAL, 16, 8);
  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::fermi, "GeForce GT 540M", tuned);
}
43
44
/** @brief Registers the row_wise_reduction_template parameter set for the "GeForce GT 540M" through db.add_8B().
*
* This overload is selected by the tag char_to_type<'T'>; the tag value itself is unused.
* NOTE(review): "8B" presumably refers to 8-byte scalar types (e.g. double) and 'T' to a transposed operand - confirm.
*
* @param db   Database that receives the entry
*/
inline void add_8B(database_type<row_wise_reduction_template::parameters_type> & db, char_to_type<'T'>)
{
  typedef row_wise_reduction_template::parameters_type profile_type;

  // Build the parameter set first, then hand it to the database by const reference.
  profile_type const tuned(4, 1, 256, 1024, FETCH_FROM_GLOBAL_STRIDED);
  db.add_8B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::fermi, "GeForce GT 540M", tuned);
}
48
49
/** @brief Registers the row_wise_reduction_template parameter set for the "GeForce GT 540M" through db.add_8B().
*
* This overload is selected by the tag char_to_type<'N'>; the tag value itself is unused.
* NOTE(review): "8B" presumably refers to 8-byte scalar types (e.g. double) and 'N' to a non-transposed operand - confirm.
*
* @param db   Database that receives the entry
*/
inline void add_8B(database_type<row_wise_reduction_template::parameters_type> & db, char_to_type<'N'>)
{
  typedef row_wise_reduction_template::parameters_type profile_type;

  // Build the parameter set first, then hand it to the database by const reference.
  profile_type const tuned(4, 1024, 1, 16, FETCH_FROM_GLOBAL_STRIDED);
  db.add_8B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::fermi, "GeForce GT 540M", tuned);
}
53
54
/** @brief Registers the row_wise_reduction_template parameter set for the "GeForce GT 540M" through db.add_4B().
*
* This overload is selected by the tag char_to_type<'T'>; the tag value itself is unused.
* NOTE(review): "4B" presumably refers to 4-byte scalar types (e.g. float) and 'T' to a transposed operand - confirm.
*
* @param db   Database that receives the entry
*/
inline void add_4B(database_type<row_wise_reduction_template::parameters_type> & db, char_to_type<'T'>)
{
  typedef row_wise_reduction_template::parameters_type profile_type;

  // Build the parameter set first, then hand it to the database by const reference.
  profile_type const tuned(4, 1, 256, 2048, FETCH_FROM_GLOBAL_STRIDED);
  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::fermi, "GeForce GT 540M", tuned);
}
58
59
/** @brief Registers the row_wise_reduction_template parameter set for the "GeForce GT 540M" through db.add_4B().
*
* This overload is selected by the tag char_to_type<'N'>; the tag value itself is unused.
* NOTE(review): "4B" presumably refers to 4-byte scalar types (e.g. float) and 'N' to a non-transposed operand - confirm.
*
* @param db   Database that receives the entry
*/
inline void add_4B(database_type<row_wise_reduction_template::parameters_type> & db, char_to_type<'N'>)
{
  typedef row_wise_reduction_template::parameters_type profile_type;

  // Build the parameter set first, then hand it to the database by const reference.
  profile_type const tuned(4, 32, 16, 128, FETCH_FROM_GLOBAL_STRIDED);
  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::fermi, "GeForce GT 540M", tuned);
}
63
64
/** @brief Registers the matrix_axpy_template parameter set for the "GeForce GT 540M" through db.add_8B().
*
* The entry is keyed by nvidia_id, CL_DEVICE_TYPE_GPU and ocl::fermi.
* NOTE(review): "8B" presumably refers to 8-byte scalar types (e.g. double) - confirm against common.hpp.
*
* @param db   Database that receives the entry
*/
inline void add_8B(database_type<matrix_axpy_template::parameters_type> & db)
{
  typedef matrix_axpy_template::parameters_type profile_type;

  // Build the parameter set first, then hand it to the database by const reference.
  profile_type const tuned(1, 1, 128, 32, 16, FETCH_FROM_GLOBAL_STRIDED);
  db.add_8B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::fermi, "GeForce GT 540M", tuned);
}
68
69
/** @brief Registers the matrix_axpy_template parameter set for the "GeForce GT 540M" through db.add_4B().
*
* The entry is keyed by nvidia_id, CL_DEVICE_TYPE_GPU and ocl::fermi.
* NOTE(review): "4B" presumably refers to 4-byte scalar types (e.g. float) - confirm against common.hpp.
*
* @param db   Database that receives the entry
*/
inline void add_4B(database_type<matrix_axpy_template::parameters_type> & db)
{
  typedef matrix_axpy_template::parameters_type profile_type;

  // Build the parameter set first, then hand it to the database by const reference.
  profile_type const tuned(1, 1, 128, 4, 4, FETCH_FROM_GLOBAL_STRIDED);
  db.add_4B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::fermi, "GeForce GT 540M", tuned);
}
73
74
/** @brief Registers the vector_axpy_template parameter set for the "GeForce GT 540M" through db.add_8B().
*
* The entry is keyed by nvidia_id, CL_DEVICE_TYPE_GPU and ocl::fermi.
* NOTE(review): "8B" presumably refers to 8-byte scalar types (e.g. double) - confirm against common.hpp.
*
* @param db   Database that receives the entry
*/
inline void add_8B(database_type<vector_axpy_template::parameters_type> & db)
{
  typedef vector_axpy_template::parameters_type profile_type;

  // Build the parameter set first, then hand it to the database by const reference.
  profile_type const tuned(1, 512, 2048, FETCH_FROM_GLOBAL_STRIDED);
  db.add_8B(nvidia_id, CL_DEVICE_TYPE_GPU, ocl::fermi, "GeForce GT 540M", tuned);
}
78
79
}
80
}
81
}
82
}
83
}
84
}
85
}
86
}
87
#endif
viennacl::ocl::fermi
Definition:
device_utils.hpp:59
viennacl::ocl::nvidia_id
Definition:
device_utils.hpp:49
viennacl::device_specific::builtin_database::database_type
Definition:
common.hpp:44
matrix_product_template.hpp
viennacl::device_specific::builtin_database::devices::gpu::nvidia::fermi::geforce_gt_540m::add_8B
void add_8B(database_type< row_wise_reduction_template::parameters_type > &db, char_to_type<'T'>)
Definition:
geforce_gt_540m.hpp:44
viennacl
Main namespace in ViennaCL. Holds all the basic types such as vector, matrix, etc. and defines operations upon them.
Definition:
cpu_ram.hpp:29
viennacl::device_specific::builtin_database::database_type::add_8B
database_type< ParamT > & add_8B(vendor_id_type p0, device_type p1, ocl::device_architecture_family p2, device_name_type p3, ParamT const &p5)
Definition:
common.hpp:83
viennacl::device_specific::FETCH_FROM_GLOBAL_STRIDED
Definition:
template_base.hpp:50
common.hpp
viennacl::device_specific::builtin_database::database_type::add_4B
database_type< ParamT > & add_4B(vendor_id_type p0, device_type p1, ocl::device_architecture_family p2, device_name_type p3, ParamT const &p5)
Definition:
common.hpp:76
matrix_axpy_template.hpp
viennacl::device_specific::char_to_type
Definition:
forwards.h:249
forwards.h
Forward declarations.
vector_axpy_template.hpp
viennacl::device_specific::FETCH_FROM_LOCAL
Definition:
template_base.hpp:49
row_wise_reduction_template.hpp
viennacl::device_specific::builtin_database::devices::gpu::nvidia::fermi::geforce_gt_540m::add_4B
void add_4B(database_type< vector_axpy_template::parameters_type > &db)
Definition:
geforce_gt_540m.hpp:24
viennacl::device_specific::template_base::parameters_type
Definition:
template_base.hpp:57
viennacl::device_specific::template_base_impl< vector_axpy_template, vector_axpy_parameters >::parameters_type
vector_axpy_parameters parameters_type
Definition:
template_base.hpp:527
viennacl
device_specific
builtin_database
devices
gpu
nvidia
fermi
geforce_gt_540m.hpp
Generated on Thu Nov 20 2014 15:15:30 for ViennaCL - The Vienna Computing Library by Doxygen 1.8.8