| 
					
				 | 
			
			
				@@ -22,6 +22,46 @@ void DetermineIfValidCudaDevice() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 { 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 } 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+EXPORT int choose_cuda_device() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+{ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+  int nDevices = 0; 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+  cudaError_t err = cudaGetDeviceCount(&nDevices); 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+  if (err != cudaSuccess) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    { 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    std::cerr << "Failed to retrieve the number of CUDA enabled devices" 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+              << std::endl; 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    return 1; 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    } 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+  for (int i = 0; i < nDevices; ++i) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    { 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    cudaDeviceProp prop; 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    cudaError_t err = cudaGetDeviceProperties(&prop, i); 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    if (err != cudaSuccess) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+      { 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+      std::cerr << "Could not retrieve properties from CUDA device " << i 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+                << std::endl; 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+      return 1; 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+      } 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    if (prop.major >= 4) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+      { 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+        err = cudaSetDevice(i); 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+        if (err != cudaSuccess) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+          { 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+          std::cout << "Could not select CUDA device " << i << std::endl; 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+          } 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+        else 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+          { 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+            return 0; 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+          } 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+      } 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    } 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+  std::cout << "Could not find a CUDA enabled card supporting compute >=3.0" 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+            << std::endl; 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+  return 1; 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+} 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 EXPORT void cuda_dynamic_lib_func() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 { 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				   DetermineIfValidCudaDevice <<<1,1>>> (); 
			 |