aboutsummaryrefslogtreecommitdiffhomepage
path: root/zluda/src
diff options
context:
space:
mode:
authorAndrzej Janik <[email protected]>2021-06-27 13:08:46 +0200
committerAndrzej Janik <[email protected]>2021-06-27 13:08:46 +0200
commitd7d38256e0580c3cfb649a641d9ed62c6ff0fc20 (patch)
tree886fc195af96df37075b4f7b5664bf755ef872ae /zluda/src
parentb2765370e5ba86f21f6c4758817b3464c52150e5 (diff)
downloadZLUDA-d7d38256e0580c3cfb649a641d9ed62c6ff0fc20.tar.gz
ZLUDA-d7d38256e0580c3cfb649a641d9ed62c6ff0fc20.zip
Fix offset calculation in kernel launch
Diffstat (limited to 'zluda/src')
-rw-r--r--zluda/src/impl/function.rs18
1 files changed, 10 insertions, 8 deletions
diff --git a/zluda/src/impl/function.rs b/zluda/src/impl/function.rs
index 4f2006c..638d08a 100644
--- a/zluda/src/impl/function.rs
+++ b/zluda/src/impl/function.rs
@@ -110,23 +110,24 @@ pub fn launch_kernel(
match (buffer_size, buffer_ptr) {
(Some(buffer_size), Some(buffer_ptr)) => {
let sum_of_kernel_argument_sizes =
- func.arg_size.iter().fold(0, |offset, size_of_arg| {
- size_of_arg + round_up_to_multiple(offset, *size_of_arg)
- });
+ func.arg_size
+ .iter()
+ .fold(0, |sum_of_arg_sizes, size_of_arg| {
+ sum_of_arg_sizes + align_to_usize(*size_of_arg)
+ });
if buffer_size != sum_of_kernel_argument_sizes {
return Err(CUresult::CUDA_ERROR_INVALID_VALUE);
}
let mut offset = 0;
for (i, arg_size) in func.arg_size.iter().enumerate() {
- let buffer_offset = round_up_to_multiple(offset, *arg_size);
unsafe {
func.base.set_arg_raw(
i as u32,
*arg_size,
- buffer_ptr.add(buffer_offset) as *const _,
+ buffer_ptr.add(offset) as *const _,
)?
};
- offset = buffer_offset + *arg_size;
+ offset += align_to_usize(*arg_size);
}
}
_ => return Err(CUresult::CUDA_ERROR_INVALID_VALUE),
@@ -159,8 +160,9 @@ pub fn launch_kernel(
})?
}
-fn round_up_to_multiple(x: usize, multiple: usize) -> usize {
- ((x + multiple - 1) / multiple) * multiple
+fn align_to_usize(value: usize) -> usize {
+ let multiple = std::mem::size_of::<usize>();
+ ((value + multiple - 1) / multiple) * multiple
}
pub(crate) fn get_attribute(