From 4ac78c89269138b4623993f9f1d81829d8e88131 Mon Sep 17 00:00:00 2001
From: Joseph Redmon <pjreddie@gmail.com>
Date: Tue, 20 Jan 2015 21:26:46 +0000
Subject: [PATCH] I am so done with opencl, switching to cuda
---
src/gemm.c | 6 +-----
1 files changed, 1 insertions(+), 5 deletions(-)
diff --git a/src/gemm.c b/src/gemm.c
index 8394991..9797b85 100644
--- a/src/gemm.c
+++ b/src/gemm.c
@@ -164,8 +164,7 @@
#define TILE 64
#define TILE_K 16
-#define WPT 8
-#define THREADS (TILE*TILE)/(WPT*WPT)
+#define THREADS 64
cl_kernel get_gemm_nn_fast_kernel()
{
@@ -175,7 +174,6 @@
gemm_kernel = get_kernel("src/gemm_fast.cl", "gemm_nn_fast", "-D TILE=" STR(TILE)
" -cl-nv-verbose "
" -D TILE_K=" STR(TILE_K)
- " -D WPT=" STR(WPT)
" -D THREADS=" STR(THREADS));
init = 1;
}
@@ -464,7 +462,6 @@
test_gpu_accuracy(0,0,128,128,128);
-/*
time_ongpu(0,0,64,2916,363);
time_ongpu_fast(0,0,64,2916,363);
time_ongpu(0,0,64,2916,363);
@@ -483,7 +480,6 @@
time_ongpu_fast(0,0,128,4096,12544);
time_ongpu(0,0,128,4096,4096);
time_ongpu_fast(0,0,128,4096,4096);
- */
// time_ongpu(1,0,2304,196,256);
// time_ongpu_fast(1,0,2304,196,256);
// time_ongpu(0,1,256,2304,196);
--
Gitblit v1.10.0