From c6ecf1e0420737eafeb99b27b1d716b46a6cbb7a Mon Sep 17 00:00:00 2001
From: Jud White <github@judsonwhite.com>
Date: Sun, 25 Mar 2018 20:41:48 +0000
Subject: [PATCH] README.md: add notes to How to compile on Windows

---
 src/cuda.h |   44 ++++++++++++++++++++++++++++++++++----------
 1 files changed, 34 insertions(+), 10 deletions(-)

diff --git a/src/cuda.h b/src/cuda.h
index cbe7975..c328fce 100644
--- a/src/cuda.h
+++ b/src/cuda.h
@@ -1,24 +1,48 @@
 #ifndef CUDA_H
 #define CUDA_H
 
+#if defined(_MSC_VER) && _MSC_VER < 1900
+	#define inline __inline
+#endif
+
 extern int gpu_index;
 
 #ifdef GPU
 
-#define BLOCK 256
+#define BLOCK 512
 
 #include "cuda_runtime.h"
+#include "curand.h"
 #include "cublas_v2.h"
 
-void check_error(cudaError_t status);
-cublasHandle_t blas_handle();
-float *cuda_make_array(float *x, int n);
-int *cuda_make_int_array(int n);
-void cuda_push_array(float *x_gpu, float *x, int n);
-void cuda_pull_array(float *x_gpu, float *x, int n);
-void cuda_free(float *x_gpu);
-float cuda_compare(float *x_gpu, float *x, int n, char *s);
-dim3 cuda_gridsize(size_t n);
+#ifdef CUDNN
+#include "cudnn.h"
+#endif
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+	void check_error(cudaError_t status);
+	cublasHandle_t blas_handle();
+	float *cuda_make_array(float *x, size_t n);
+	int *cuda_make_int_array(size_t n);
+	void cuda_push_array(float *x_gpu, float *x, size_t n);
+	void cuda_pull_array(float *x_gpu, float *x, size_t n);
+	void cuda_set_device(int n);
+	int cuda_get_device();
+	void cuda_free(float *x_gpu);
+	void cuda_random(float *x_gpu, size_t n);
+	float cuda_compare(float *x_gpu, float *x, size_t n, char *s);
+	dim3 cuda_gridsize(size_t n);
+	cudaStream_t get_cuda_stream();
+#ifdef __cplusplus
+}
+#endif
+
+#ifdef CUDNN
+cudnnHandle_t cudnn_handle();
+enum {cudnn_fastest, cudnn_smallest};
+#endif
 
 #endif
 #endif

--
Gitblit v1.10.0