Return max memory

This commit is contained in:
Andrzej Janik
2020-02-17 21:14:23 +01:00
parent 796e030c4e
commit 925af66b19
3 changed files with 110 additions and 17 deletions

View File

@ -11,10 +11,12 @@ pub unsafe extern "C" fn cuGetExportTable(
) -> cu::Result { ) -> cu::Result {
if *id == CU_ETID_ToolsRuntimeCallbackHooks { if *id == CU_ETID_ToolsRuntimeCallbackHooks {
*table = TABLE0.as_ptr() as *const _; *table = TABLE0.as_ptr() as *const _;
return cu::Result::SUCCESS;
} else if *id == CU_ETID_CudartInterface { } else if *id == CU_ETID_CudartInterface {
*table = TABLE1.as_ptr() as *const _; *table = TABLE1.as_ptr() as *const _;
return cu::Result::SUCCESS;
} }
return cu::Result::SUCCESS; cu::Result::ERROR_NOT_SUPPORTED
} }
const CU_ETID_ToolsRuntimeCallbackHooks: cu::Uuid = cu::Uuid { const CU_ETID_ToolsRuntimeCallbackHooks: cu::Uuid = cu::Uuid {

View File

@ -5,17 +5,31 @@ extern crate lazy_static;
use std::sync::Mutex; use std::sync::Mutex;
use std::ptr; use std::ptr;
use std::cmp; use std::cmp;
use std::os::raw::{c_char, c_int}; use std::os::raw::{c_char, c_int, c_uint};
mod cu; mod cu;
mod export_table; mod export_table;
mod ze;
use ze::Versioned;
macro_rules! l0_check_err {
($exp:expr) => {
{
let result = unsafe{ $exp };
if result != l0::ze_result_t::ZE_RESULT_SUCCESS {
return Err(result);
}
}
};
}
macro_rules! l0_check { macro_rules! l0_check {
($exp:expr) => { ($exp:expr) => {
{ {
let result = unsafe{ $exp }; let result = unsafe{ $exp };
if result != l0::ze_result_t::ZE_RESULT_SUCCESS { if result != l0::ze_result_t::ZE_RESULT_SUCCESS {
return Err(result) return result;
} }
} }
}; };
@ -36,11 +50,11 @@ impl Driver {
fn new() -> Result<Driver, l0::ze_result_t> { fn new() -> Result<Driver, l0::ze_result_t> {
let mut driver_count = 1; let mut driver_count = 1;
let mut handle = ptr::null_mut(); let mut handle = ptr::null_mut();
l0_check!{ l0::zeDriverGet(&mut driver_count, &mut handle) }; l0_check_err!{ l0::zeDriverGet(&mut driver_count, &mut handle) };
let mut count = 0; let mut count = 0;
l0_check! { l0::zeDeviceGet(handle, &mut count, ptr::null_mut()) } l0_check_err! { l0::zeDeviceGet(handle, &mut count, ptr::null_mut()) }
let mut devices = vec![ptr::null_mut(); count as usize]; let mut devices = vec![ptr::null_mut(); count as usize];
l0_check! { l0::zeDeviceGet(handle, &mut count, devices.as_mut_ptr()) } l0_check_err! { l0::zeDeviceGet(handle, &mut count, devices.as_mut_ptr()) }
if (count as usize) < devices.len() { if (count as usize) < devices.len() {
devices.truncate(count as usize); devices.truncate(count as usize);
} }
@ -67,7 +81,7 @@ impl Driver {
} }
fn device_get(&self, device: *mut cu::Device, ordinal: c_int) -> l0::ze_result_t { fn device_get(&self, device: *mut cu::Device, ordinal: c_int) -> l0::ze_result_t {
if ordinal < 0 || (ordinal as usize) >= self.devices.len() { if (ordinal as usize) >= self.devices.len() {
return l0::ze_result_t::ZE_RESULT_ERROR_INVALID_ARGUMENT; return l0::ze_result_t::ZE_RESULT_ERROR_INVALID_ARGUMENT;
} }
unsafe { *device = cu::Device(ordinal) }; unsafe { *device = cu::Device(ordinal) };
@ -75,35 +89,55 @@ impl Driver {
} }
fn device_get_name(&self, name: *mut c_char, len: c_int, cu::Device(dev): cu::Device) -> l0::ze_result_t { fn device_get_name(&self, name: *mut c_char, len: c_int, cu::Device(dev): cu::Device) -> l0::ze_result_t {
if len <= 0 || dev < 0 || (dev as usize) >= self.devices.len() { if (dev as usize) >= self.devices.len() {
return l0::ze_result_t::ZE_RESULT_ERROR_INVALID_ARGUMENT; return l0::ze_result_t::ZE_RESULT_ERROR_INVALID_ARGUMENT;
} }
let mut props = Box::new(unsafe { std::mem::zeroed::<l0::ze_device_properties_t>() }); let mut props = Box::new(l0::ze_device_properties_t::new());
props.version = l0::ze_device_properties_version_t::ZE_DEVICE_PROPERTIES_VERSION_CURRENT; l0_check! { l0::zeDeviceGetProperties(self.devices[dev as usize], props.as_mut()) };
let result = unsafe { l0::zeDeviceGetProperties(self.devices[dev as usize], props.as_mut()) };
if result != l0::ze_result_t::ZE_RESULT_SUCCESS {
return result;
}
let null_pos = props.name.iter().position(|&c| c == 0).unwrap_or(0); let null_pos = props.name.iter().position(|&c| c == 0).unwrap_or(0);
let dst_null_pos = cmp::min((len - 1) as usize, null_pos); let dst_null_pos = cmp::min((len - 1) as usize, null_pos);
unsafe { *(name.add(dst_null_pos)) = 0 }; unsafe { *(name.add(dst_null_pos)) = 0 };
unsafe { std::ptr::copy_nonoverlapping(props.name.as_ptr(), name, dst_null_pos) }; unsafe { std::ptr::copy_nonoverlapping(props.name.as_ptr(), name, dst_null_pos) };
l0::ze_result_t::ZE_RESULT_SUCCESS l0::ze_result_t::ZE_RESULT_SUCCESS
} }
fn device_total_mem(&self, bytes: *mut usize, cu::Device(dev): cu::Device) -> l0::ze_result_t {
if (dev as usize) >= self.devices.len() {
return l0::ze_result_t::ZE_RESULT_ERROR_INVALID_ARGUMENT;
}
let dev = dev as usize;
let mut count = 0;
l0_check! { l0::zeDeviceGetMemoryProperties(self.devices[dev], &mut count, ptr::null_mut()) };
if count == 0 {
return l0::ze_result_t::ZE_RESULT_ERROR_UNKNOWN;
}
let mut props = vec![l0::ze_device_memory_properties_t::new(); count as usize];
l0_check! { l0::zeDeviceGetMemoryProperties(self.devices[dev], &mut count, props.as_mut_ptr()) };
let iter_count = cmp::min(count as usize, props.len());
if iter_count == 0 {
return l0::ze_result_t::ZE_RESULT_ERROR_UNKNOWN;
}
let max_mem = props.iter().take(iter_count).map(|p| p.totalSize).max().unwrap();
unsafe { *bytes = max_mem as usize };
l0::ze_result_t::ZE_RESULT_SUCCESS
}
} }
#[no_mangle] #[no_mangle]
pub extern "C" fn cuDriverGetVersion(version: &mut c_int) -> cu::Result { pub unsafe extern "C" fn cuDriverGetVersion(version: *mut c_int) -> cu::Result {
if version == ptr::null_mut() {
return cu::Result::ERROR_INVALID_VALUE;
}
*version = i32::max_value(); *version = i32::max_value();
return cu::Result::SUCCESS; return cu::Result::SUCCESS;
} }
#[no_mangle] #[no_mangle]
pub unsafe extern "C" fn cuInit(_: *const c_int) -> cu::Result { pub unsafe extern "C" fn cuInit(_: c_uint) -> cu::Result {
let l0_init = l0::zeInit(l0::ze_init_flag_t::ZE_INIT_FLAG_GPU_ONLY); let l0_init = l0::zeInit(l0::ze_init_flag_t::ZE_INIT_FLAG_GPU_ONLY);
if l0_init != l0::ze_result_t::ZE_RESULT_SUCCESS { if l0_init != l0::ze_result_t::ZE_RESULT_SUCCESS {
return cu::Result::from_l0(l0_init); return cu::Result::from_l0(l0_init);
}; }
let mut lock = GLOBAL_STATE.try_lock(); let mut lock = GLOBAL_STATE.try_lock();
if let Ok(ref mut mutex) = lock { if let Ok(ref mut mutex) = lock {
if let None = **mutex { if let None = **mutex {
@ -120,15 +154,34 @@ pub unsafe extern "C" fn cuInit(_: *const c_int) -> cu::Result {
#[no_mangle] #[no_mangle]
pub extern "C" fn cuDeviceGetCount(count: *mut c_int) -> cu::Result { pub extern "C" fn cuDeviceGetCount(count: *mut c_int) -> cu::Result {
if count == ptr::null_mut() {
return cu::Result::ERROR_INVALID_VALUE;
}
Driver::call(|driver| driver.device_get_count(count)) Driver::call(|driver| driver.device_get_count(count))
} }
#[no_mangle] #[no_mangle]
pub extern "C" fn cuDeviceGet(device: *mut cu::Device, ordinal: c_int) -> cu::Result { pub extern "C" fn cuDeviceGet(device: *mut cu::Device, ordinal: c_int) -> cu::Result {
if ordinal < 0 || device == ptr::null_mut() {
return cu::Result::ERROR_INVALID_VALUE;
}
Driver::call(|driver| driver.device_get(device, ordinal)) Driver::call(|driver| driver.device_get(device, ordinal))
} }
#[no_mangle] #[no_mangle]
pub extern "C" fn cuDeviceGetName(name: *mut c_char, len: c_int, dev: cu::Device) -> cu::Result { pub extern "C" fn cuDeviceGetName(name: *mut c_char, len: c_int, dev: cu::Device) -> cu::Result {
let cu::Device(dev_idx) = dev;
if len <= 0 || dev_idx < 0 || name == ptr::null_mut() {
return cu::Result::ERROR_INVALID_VALUE;
}
Driver::call(|driver| driver.device_get_name(name, len, dev)) Driver::call(|driver| driver.device_get_name(name, len, dev))
}
#[no_mangle]
pub extern "C" fn cuDeviceTotalMem_v2(bytes: *mut usize, dev: cu::Device) -> cu::Result {
let cu::Device(dev_idx) = dev;
if dev_idx < 0 || bytes == ptr::null_mut() {
return cu::Result::ERROR_INVALID_VALUE;
}
Driver::call(|driver| driver.device_total_mem(bytes, dev))
} }

38
notcuda/src/ze.rs Normal file
View File

@ -0,0 +1,38 @@
use level_zero_sys::*;
/// Structs that carry a version tag which has to be filled in before use.
///
/// Implementors expose their tag through [`Versioned::version`] and name the
/// value it should hold through [`Versioned::current`]; [`Versioned::new`]
/// combines the two into a ready-made constructor.
pub trait Versioned: Sized {
    /// Type of the version tag stored inside the struct.
    type Version;

    /// Creates a value whose bytes are all zero except for the version tag,
    /// which is set to [`Versioned::current`].
    ///
    /// The storage is zeroed through `MaybeUninit` and the tag is written
    /// *before* the value is treated as initialized. Unlike
    /// `std::mem::zeroed::<Self>()`, this never produces a typed `Self` whose
    /// tag holds an all-zero bit pattern, which matters when the tag is an
    /// enum without a zero discriminant.
    ///
    /// Implementors must make sure that every field other than the version
    /// tag is valid when zero-filled, and that `version()` is a plain field
    /// projection that does not read any other part of `self`.
    fn new() -> Self {
        let mut raw = std::mem::MaybeUninit::<Self>::zeroed();
        // SAFETY: `raw` is properly aligned, zero-filled storage for `Self`.
        // `version()` only hands back the address of the tag, and the tag is
        // stored with `ptr::write`, so the zeroed placeholder is neither read
        // nor dropped. After the write every field holds a valid value
        // (see the implementor contract above), so `assume_init` is sound.
        unsafe {
            let tag: *mut Self::Version = (*raw.as_mut_ptr()).version();
            std::ptr::write(tag, Self::current());
            raw.assume_init()
        }
    }

    /// Version value that freshly constructed structs should carry.
    fn current() -> Self::Version;

    /// Mutable access to the version tag stored in `self`.
    fn version(&mut self) -> &mut Self::Version;
}
/// Version-tag plumbing for `ze_device_memory_properties_t`.
impl Versioned for ze_device_memory_properties_t {
    type Version = ze_device_memory_properties_version_t;

    /// Tag value stored in newly created memory-properties structs.
    fn current() -> ze_device_memory_properties_version_t {
        let tag =
            ze_device_memory_properties_version_t::ZE_DEVICE_MEMORY_PROPERTIES_VERSION_CURRENT;
        tag
    }

    /// Borrows the struct's `version` field mutably.
    fn version(&mut self) -> &mut ze_device_memory_properties_version_t {
        let Self { version, .. } = self;
        version
    }
}
/// Version-tag plumbing for `ze_device_properties_t`.
impl Versioned for ze_device_properties_t {
    type Version = ze_device_properties_version_t;

    /// Tag value stored in newly created device-properties structs.
    fn current() -> ze_device_properties_version_t {
        let tag = ze_device_properties_version_t::ZE_DEVICE_PROPERTIES_VERSION_CURRENT;
        tag
    }

    /// Borrows the struct's `version` field mutably.
    fn version(&mut self) -> &mut ze_device_properties_version_t {
        let Self { version, .. } = self;
        version
    }
}