From a284a7da8d1facbf984a22302665a2a50295a687 Mon Sep 17 00:00:00 2001
From: AlexeyAB <alexeyab84@gmail.com>
Date: Wed, 08 Aug 2018 16:08:58 +0000
Subject: [PATCH] Try to use avx_hs() - slow and requires alignment 4096 bits < (l.size*l.size*l.c) May be faster only from 8192 bits and more.

---
 Makefile |    4 ++--
 1 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/Makefile b/Makefile
index 5c39df1..ba61086 100644
--- a/Makefile
+++ b/Makefile
@@ -29,8 +29,8 @@
 # GP100/Tesla P100 – DGX-1
 # ARCH= -gencode arch=compute_60,code=sm_60
 
-# For Jetson Tx1 uncomment:
-# ARCH= -gencode arch=compute_51,code=[sm_51,compute_51]
+# For Jetson TX1, Tegra X1, DRIVE CX, DRIVE PX - uncomment:
+# ARCH= -gencode arch=compute_53,code=[sm_53,compute_53]
 
 # For Jetson Tx2 or Drive-PX2 uncomment:
 # ARCH= -gencode arch=compute_62,code=[sm_62,compute_62]
-- 
Gitblit v1.10.0