package com.sheepit.client.hardware.gpu.nvidia; import java.util.HashMap; import java.util.LinkedList; import java.util.List; import java.util.Map; import com.sheepit.client.hardware.gpu.nvidia.CUDeviceAttribute; import com.sheepit.client.hardware.gpu.GPUDevice; import com.sheepit.client.hardware.gpu.GPULister; import com.sheepit.client.os.OS; import com.sun.jna.Native; import com.sun.jna.ptr.IntByReference; import com.sun.jna.ptr.LongByReference; public class Nvidia implements GPULister { public static String TYPE = "CUDA"; @Override public List getGpus() { OS os = OS.getOS(); String path = os.getCUDALib(); if (path == null) { return null; } CUDA cudalib = null; try { cudalib = (CUDA) Native.loadLibrary(path, CUDA.class); } catch (java.lang.UnsatisfiedLinkError e) { return null; } catch (java.lang.ExceptionInInitializerError e) { System.out.println("Nvidia::getGpus ExceptionInInitializerError " + e); return null; } catch (Exception e) { System.out.println("Nvidia::getGpus generic exception " + e); return null; } int result = CUresult.CUDA_ERROR_UNKNOWN; result = cudalib.cuInit(0); if (result != CUresult.CUDA_SUCCESS) { System.out.println("Nvidia::getGpus cuInit failed (ret: " + result + ")"); if (result == CUresult.CUDA_ERROR_UNKNOWN) { System.out.println("If you are running Linux, this error is usually due to nvidia kernel module 'nvidia_uvm' not loaded."); System.out.println("Relaunch the application as root or load the module."); System.out.println("Most of time it does fix the issue."); } return null; } if (result == CUresult.CUDA_ERROR_NO_DEVICE) { return null; } IntByReference count = new IntByReference(); result = cudalib.cuDeviceGetCount(count); if (result != CUresult.CUDA_SUCCESS) { System.out.println("Nvidia::getGpus cuDeviceGetCount failed (ret: " + CUresult.stringFor(result) + ")"); return null; } List devices = new LinkedList(); HashMap devicesWithPciId = new HashMap(count.getValue()); for (int num = 0; num < count.getValue(); num++) { IntByReference aDevice = new IntByReference(); result = cudalib.cuDeviceGet(aDevice, num); if (result != CUresult.CUDA_SUCCESS) { System.out.println("Nvidia::getGpus cuDeviceGet failed (ret: " + CUresult.stringFor(result) + ")"); continue; } IntByReference pciDomainId = new IntByReference(); IntByReference pciBusId = new IntByReference(); IntByReference pciDeviceId = new IntByReference(); result = cudalib.cuDeviceGetAttribute(pciDomainId, CUDeviceAttribute.CU_DEVICE_ATTRIBUTE_PCI_DOMAIN_ID, aDevice.getValue()); if (result != CUresult.CUDA_SUCCESS) { System.out.println("Nvidia::getGpus cuDeviceGetAttribute for CU_DEVICE_ATTRIBUTE_PCI_DOMAIN_ID failed (ret: " + CUresult.stringFor(result) + ")"); continue; } result = cudalib.cuDeviceGetAttribute(pciBusId, CUDeviceAttribute.CU_DEVICE_ATTRIBUTE_PCI_BUS_ID, aDevice.getValue()); if (result != CUresult.CUDA_SUCCESS) { System.out.println("Nvidia::getGpus cuDeviceGetAttribute for CU_DEVICE_ATTRIBUTE_PCI_BUS_ID failed (ret: " + CUresult.stringFor(result) + ")"); continue; } result = cudalib.cuDeviceGetAttribute(pciDeviceId, CUDeviceAttribute.CU_DEVICE_ATTRIBUTE_PCI_DEVICE_ID, aDevice.getValue()); if (result != CUresult.CUDA_SUCCESS) { System.out.println("Nvidia::getGpus cuDeviceGetAttribute for CU_DEVICE_ATTRIBUTE_PCI_DEVICE_ID failed (ret: " + CUresult.stringFor(result) + ")"); continue; } byte name[] = new byte[256]; result = cudalib.cuDeviceGetName(name, 256, num); if (result != CUresult.CUDA_SUCCESS) { System.out.println("Nvidia::getGpus cuDeviceGetName failed (ret: " + CUresult.stringFor(result) + ")"); continue; } LongByReference ram = new LongByReference(); try { result = cudalib.cuDeviceTotalMem_v2(ram, num); } catch (UnsatisfiedLinkError e) { // fall back to old function result = cudalib.cuDeviceTotalMem(ram, num); } if (result != CUresult.CUDA_SUCCESS) { System.out.println("Nvidia::getGpus cuDeviceTotalMem failed (ret: " + CUresult.stringFor(result) + ")"); return null; } String blenderId = String.format("CUDA_%s_%04x:%02x:%02x", new String(name).trim(), pciDomainId.getValue(), pciBusId.getValue(), pciDeviceId.getValue()); devicesWithPciId.put(Integer.toString(pciBusId.getValue()), new GPUDevice(TYPE, new String(name).trim(), ram.getValue(), blenderId)); } // for backward compatibility generate a CUDA_N id // in theory a set to environment "CUDA_DEVICE_ORDER=PCI_BUS_ID" should be enough but it didn't work int i = 0; for (Map.Entry entry : devicesWithPciId.entrySet()){ GPUDevice aDevice = entry.getValue(); aDevice.setOldId(TYPE + "_" + Integer.toString(i)); devices.add(aDevice); i++; } return devices; } }