flops: unroll the accumulation loop by 16 via opencl_unroll_hint(16)
This commit is contained in:
@@ -5,7 +5,7 @@ __kernel void flops (__global volatile const float *src,
|
|||||||
int gid = get_global_id(0);
|
int gid = get_global_id(0);
|
||||||
float f = 0.0f;
|
float f = 0.0f;
|
||||||
float incr = src[0];
|
float incr = src[0];
|
||||||
__attribute__((opencl_unroll_hint))
|
__attribute__((opencl_unroll_hint(16)))
|
||||||
for (int i = 0; i < 5000; i++) {
|
for (int i = 0; i < 5000; i++) {
|
||||||
f += incr;
|
f += incr;
|
||||||
}
|
}
|
||||||
|
|||||||
Reference in New Issue
Block a user