From 14303717dcddae43cdc55beb0685dae86f566fd8 Mon Sep 17 00:00:00 2001
From: Joseph Redmon <pjreddie@gmail.com>
Date: Sat, 25 Oct 2014 18:57:26 +0000
Subject: [PATCH] Fast, needs to be faster

---
 src/opencl.c |   33 ++++++++++++++++++++++++++++++---
 1 files changed, 30 insertions(+), 3 deletions(-)

diff --git a/src/opencl.c b/src/opencl.c
index bcc0f09..604a2e3 100644
--- a/src/opencl.c
+++ b/src/opencl.c
@@ -1,11 +1,13 @@
 #ifdef GPU
-#include "opencl.h"
 #include <stdio.h>
 #include <stdlib.h>
 #include <string.h>
 #include <time.h>
 #include <unistd.h>
+#include <clBLAS.h>
 
+#include "opencl.h"
+#include "utils.h"
 
 cl_info cl = {0};
 
@@ -79,9 +81,9 @@
 
     }
     int index = getpid()%num_devices;
+    index = 1;
     printf("%d rand, %d devices, %d index\n", getpid(), num_devices, index);
-    //info.device = devices[index];
-    info.device = devices[0];
+    info.device = devices[index];
     fprintf(stderr, "Found %d device(s)\n", num_devices);
     check_error(info);
 
@@ -93,16 +95,31 @@
     check_error(info);
     info.queue = clCreateCommandQueue(info.context, info.device, 0, &info.error);
     check_error(info);
+    for(i = 0; i < NUM_QUEUES; ++i){
+        info.queues[i] = clCreateCommandQueue(info.context, info.device, 0, &info.error);
+        check_error(info);
+    }
+    info.error = clblasSetup();
+    check_error(info);
     info.initialized = 1;
     return info;
 }
 
+/* Call clFinish on each of the NUM_QUEUES queues in cl.queues, in index order. */
+void wait_for_queues()
+{
+    int q = 0;
+    /* The status returned by clFinish is not inspected. */
+    while(q < NUM_QUEUES) clFinish(cl.queues[q++]);
+}
+
 cl_program cl_fprog(char *filename, char *options, cl_info info)
 {
 	size_t srcsize;
 	char src[64*1024];
 	memset(src, 0, 64*1024);
 	FILE *fil=fopen(filename,"r");
+    if(fil == 0) file_error(filename);
 	srcsize=fread(src, sizeof src, 1, fil);
 	fclose(fil);
 	const char *srcptr[]={src};
@@ -178,4 +195,14 @@
     return mem;
 }
 
+/* Calls cl_setup(), then creates a read-write buffer of n ints copied from x. */
+cl_mem cl_make_int_array(int *x, int n)
+{
+    cl_setup();
+    size_t bytes = sizeof(int)*n;
+    cl_mem buffer = clCreateBuffer(cl.context, CL_MEM_READ_WRITE|CL_MEM_COPY_HOST_PTR, bytes, x, &cl.error);
+    check_error(cl); /* cl.error was written by clCreateBuffer above */
+    return buffer;
+}
+
 #endif

--
Gitblit v1.10.0