Skip to content

adding the MPS version of running_compute_processes for >= Volta. #112

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Open
wants to merge 1 commit into
base: main
Choose a base branch
from
Open
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
63 changes: 63 additions & 0 deletions nvml-wrapper/src/device.rs
Original file line number Diff line number Diff line change
Expand Up @@ -624,6 +624,63 @@ impl<'nvml> Device<'nvml> {
}
}

/// Asks NVML how many entries `nvmlDeviceGetMPSComputeRunningProcesses_v3` would
/// report for this `Device`, without fetching the entries themselves.
///
/// The symbol is invoked with a zero count and a null output buffer. If NVML
/// answers with `NVML_ERROR_INSUFFICIENT_SIZE`, the count it wrote back is returned.
/// Any other status is passed through `nvml_try`: errors propagate and a
/// successful status yields `0`.
fn mps_running_compute_processes_count(&self) -> Result<c_uint, NvmlError> {
    let query = nvml_sym(
        self.nvml
            .lib
            .nvmlDeviceGetMPSComputeRunningProcesses_v3
            .as_ref(),
    )?;

    // Start from zero so the call cannot write any entries; only the count
    // variable is expected to be updated.
    let mut required: c_uint = 0;

    unsafe {
        let status = query(self.device, &mut required, ptr::null_mut());

        match status {
            // NVML reported that the (empty) buffer was too small: `required`
            // now holds the count it wrote back.
            nvmlReturn_enum_NVML_ERROR_INSUFFICIENT_SIZE => Ok(required),
            // Success maps to a count of zero; anything else becomes an error.
            other_status => nvml_try(other_status).map(|_| 0),
        }
    }
}

/**
Gets information about processes with a compute context running on this `Device`,
using the MPS variant of the NVML query.

The list is gathered in two steps: a first call obtains the number of processes and a
second call fills a buffer with their details. The set of processes can change between
those two calls, so the buffer is allocated with a few spare slots to tolerate
processes that start in between.

# Errors

* `Uninitialized`, if the library has not been successfully initialized
* `InvalidArg`, if this `Device` is invalid
* `GpuLost`, if this `Device` has fallen off the bus or is otherwise inaccessible
* `InsufficientSize`, if more processes started between the two calls than the spare
  slots can absorb
* `Unknown`, on any unexpected error

# Device Support

Supports Volta or newer fully supported devices.
*/
#[doc(alias = "nvmlDeviceGetMPSComputeRunningProcesses_v3")]
pub fn mps_running_compute_processes(&self) -> Result<Vec<ProcessInfo>, NvmlError> {
    // Spare slots added on top of the reported count, in case more processes are
    // launched between the count query and the data query.
    const HEADROOM: c_uint = 5;

    let sym = nvml_sym(
        self.nvml
            .lib
            .nvmlDeviceGetMPSComputeRunningProcesses_v3
            .as_ref(),
    )?;

    let reported: c_uint = match self.mps_running_compute_processes_count()? {
        0 => return Ok(vec![]),
        value => value,
    };

    // `saturating_add` keeps the capacity well-defined even for an absurd count.
    let capacity: c_uint = reported.saturating_add(HEADROOM);
    let mut len: c_uint = capacity;
    let mut processes: Vec<nvmlProcessInfo_t> = Vec::with_capacity(capacity as usize);

    unsafe {
        nvml_try(sym(self.device, &mut len, processes.as_mut_ptr()))?;

        // SAFETY: the call succeeded, so NVML is expected to have initialized the
        // first `len` entries of the buffer. The length is additionally clamped to
        // the allocated capacity so `set_len` can never exceed the allocation.
        processes.set_len(len.min(capacity) as usize);
    }

    Ok(processes.into_iter().map(ProcessInfo::from).collect())
}

/**
Gets the number of processes with a compute context running on this `Device`.

Expand Down Expand Up @@ -6633,6 +6690,12 @@ mod test {
test_with_device(3, &nvml, |device| device.running_compute_processes_v2())
}

#[test]
fn mps_running_compute_processes() {
    // Runs the MPS process query through the shared per-device test helper.
    let lib = nvml();
    test_with_device(3, &lib, |dev| dev.mps_running_compute_processes())
}

#[cfg(target_os = "linux")]
#[test]
fn cpu_affinity() {
Expand Down
Loading