From 08b757a0bf76efe8c76b453063a1bb19315bcaa6 Mon Sep 17 00:00:00 2001
From: Joseph Redmon <pjreddie@gmail.com>
Date: Wed, 14 Jan 2015 20:18:57 +0000
Subject: [PATCH] Stable, needs to be way faster
---
src/axpy.cl | 24 ++++++++++++++++++++++++
1 files changed, 24 insertions(+), 0 deletions(-)
diff --git a/src/axpy.cl b/src/axpy.cl
index e69de29..1503e8f 100644
--- a/src/axpy.cl
+++ b/src/axpy.cl
@@ -0,0 +1,24 @@
+__kernel void axpy(int N, float ALPHA, __global float *X, int OFFX, int INCX, __global float *Y, int OFFY, int INCY)
+{
+ int i = get_global_id(0);
+ Y[OFFY+i*INCY] += ALPHA*X[OFFX+i*INCX];
+}
+
+__kernel void scal(int N, float ALPHA, __global float *X, int INCX)
+{
+ int i = get_global_id(0);
+ X[i*INCX] *= ALPHA;
+}
+
+__kernel void mask(int n, __global float *x, __global float *mask, int mod)
+{
+ int i = get_global_id(0);
+ x[i] = (i%mod && !mask[(i/mod)*mod]) ? 0 : x[i];
+}
+
+__kernel void copy(int N, __global float *X, int OFFX, int INCX, __global float *Y, int OFFY, int INCY)
+{
+ int i = get_global_id(0);
+ Y[i*INCY + OFFY] = X[i*INCX + OFFX];
+}
+
--
Gitblit v1.10.0