Added a quick printout of the hardware info. Running into a problem choosing between platforms, going to abstract CL out into it's own class and hide all that logic

2016-08-14 00:03:44 -07:00
parent 3c9b39f682
commit edd8075afb
19 changed files with 2159 additions and 2084 deletions
--- a/kernels/kernel.txt
+++ b/kernels/kernel.txt
@@ -1,32 +1,32 @@
-__constant sampler_t sampler =
-      CLK_NORMALIZED_COORDS_FALSE
-    | CLK_ADDRESS_CLAMP_TO_EDGE
-    | CLK_FILTER_NEAREST;
-
-__constant int FILTER_SIZE = 10;
-
-float FilterValue (__constant const float* filterWeights,
-    const int x, const int y)
-{
-    return filterWeights[(x+FILTER_SIZE) + (y+FILTER_SIZE)*(FILTER_SIZE*2 + 1)];
-}
-
-__kernel void Filter (
-    __read_only image2d_t input,
-    __constant float* filterWeights,
-    __write_only image2d_t output)
-{
-    const int2 pos = {get_global_id(0), get_global_id(1)};
-
-    float4 sum = (float4)(0.0f);
-    for(int y = -FILTER_SIZE; y <= FILTER_SIZE; y++) {
-        for(int x = -FILTER_SIZE; x <= FILTER_SIZE; x++) {
-            sum += FilterValue(filterWeights, x, y)
-                * read_imagef(input, sampler, pos + (int2)(x,y));
-        }
-    }
-
-    write_imagef (output, (int2)(pos.x, pos.y), sum);
-}
-
-
+__constant sampler_t sampler =
+      CLK_NORMALIZED_COORDS_FALSE
+    | CLK_ADDRESS_CLAMP_TO_EDGE
+    | CLK_FILTER_NEAREST;
+
+__constant int FILTER_SIZE = 10;
+
+float FilterValue (__constant const float* filterWeights,
+    const int x, const int y)
+{
+    return filterWeights[(x+FILTER_SIZE) + (y+FILTER_SIZE)*(FILTER_SIZE*2 + 1)];
+}
+
+__kernel void Filter (
+    __read_only image2d_t input,
+    __constant float* filterWeights,
+    __write_only image2d_t output)
+{
+    const int2 pos = {get_global_id(0), get_global_id(1)};
+
+    float4 sum = (float4)(0.0f);
+    for(int y = -FILTER_SIZE; y <= FILTER_SIZE; y++) {
+        for(int x = -FILTER_SIZE; x <= FILTER_SIZE; x++) {
+            sum += FilterValue(filterWeights, x, y)
+                * read_imagef(input, sampler, pos + (int2)(x,y));
+        }
+    }
+
+    write_imagef (output, (int2)(pos.x, pos.y), sum);
+}
+
+