arrayfire
diff --git a/‎.github/workflows/ci.yml
Lines changed: 2 additions & 2 deletions b/‎.github/workflows/ci.yml
Lines changed: 2 additions & 2 deletions
diff --git a/‎Cargo.toml
Lines changed: 4 additions & 0 deletions b/‎Cargo.toml
Lines changed: 4 additions & 0 deletions
diff --git a/‎README.md
Lines changed: 1 addition & 1 deletion b/‎README.md
Lines changed: 1 addition & 1 deletion
diff --git a/‎cuda-interop/Cargo.toml
Lines changed: 1 addition & 1 deletion b/‎cuda-interop/Cargo.toml
Lines changed: 1 addition & 1 deletion
diff --git a/‎cuda-interop/examples/cuda_af_app.rs
Lines changed: 0 additions & 1 deletion b/‎cuda-interop/examples/cuda_af_app.rs
Lines changed: 0 additions & 1 deletion
diff --git a/‎examples/helloworld.rs
Lines changed: 3 additions & 3 deletions b/‎examples/helloworld.rs
Lines changed: 3 additions & 3 deletions
diff --git a/‎opencl-interop/Cargo.toml
Lines changed: 1 addition & 1 deletion b/‎opencl-interop/Cargo.toml
Lines changed: 1 addition & 1 deletion
diff --git a/‎opencl-interop/examples/custom_kernel.rs
Lines changed: 1 addition & 1 deletion b/‎opencl-interop/examples/custom_kernel.rs
Lines changed: 1 addition & 1 deletion
diff --git a/‎src/algorithm/mod.rs
Lines changed: 115 additions & 25 deletions b/‎src/algorithm/mod.rs
Lines changed: 115 additions & 25 deletions
@@ -48,8 +48,8 @@ jobs:
                   export AF_PATH=${GITHUB_WORKSPACE}/afbin
                   export LD_LIBRARY_PATH=${LD_LIBRARY_PATH}:${AF_PATH}/lib64
                   echo "Using cargo version: $(cargo --version)"
-                  cargo build --all
-                  cargo test --no-fail-fast
+                  cargo build --all --all-features
+                  cargo test --no-fail-fast --all-features
 
     format:
         name: Format Check
 
@@ -46,15 +46,19 @@ statistics = []
 vision = []
 default = ["algorithm", "arithmetic", "blas", "data", "indexing", "graphics", "image", "lapack",
 "ml", "macros", "random", "signal", "sparse", "statistics", "vision"]
+afserde = ["serde"]
 
 [dependencies]
 libc = "0.2"
 num  = "0.2"
 lazy_static = "1.0"
 half = "1.5.0"
+serde = { version = "1.0", features = ["derive"], optional = true }
 
 [dev-dependencies]
 half = "1.5.0"
+serde_json = "1.0"
+bincode = "1.3"
 
 [build-dependencies]
 serde_json = "1.0"
 
@@ -16,7 +16,7 @@ Only, Major(M) & Minor(m) version numbers need to match. *p1* and *p2* are patch
 
 ## Supported platforms
 
-Linux, Windows and OSX. Rust 1.15.1 or higher is required.
+Linux, Windows and OSX. Rust 1.31 or newer is required.
 
 ## Use from Crates.io [![][6]][7] [![][8]][9]
 
 
@@ -19,7 +19,7 @@ rustacuda = "0.1"
 rustacuda_core = "0.1"
 
 [[example]]
-name = "custom_kernel"
+name = "afcuda_custom_kernel"
 path = "examples/custom_kernel.rs"
 
 [[example]]
 
@@ -1,6 +1,5 @@
 use arrayfire::{af_print, dim4, info, set_device, Array};
 use rustacuda::prelude::*;
-use rustacuda::*;
 
 fn main() {
     // MAKE SURE to do all rustacuda initialization before arrayfire API's
 
@@ -13,14 +13,14 @@ fn main() {
     );
     println!("Revision: {}", get_revision());
 
-    let num_rows: u64 = 5;
-    let num_cols: u64 = 3;
+    let num_rows: i64 = 5;
+    let num_cols: i64 = 3;
     let values: [f32; 3] = [1.0, 2.0, 3.0];
     let indices = Array::new(&values, Dim4::new(&[3, 1, 1, 1]));
 
     af_print!("Indices ", indices);
 
-    let dims = Dim4::new(&[num_rows, num_cols, 1, 1]);
+    let dims = Dim4::new(&[num_rows as u64, num_cols as u64, 1, 1]);
 
     let mut a = randu::<f32>(dims);
     af_print!("Create a 5-by-3 float   matrix on the GPU", a);
 
@@ -18,7 +18,7 @@ cl-sys = "0.4.2"
 ocl-core = "0.11.2"
 
 [[example]]
-name = "custom_kernel"
+name = "afocl_custom_kernel"
 path = "examples/custom_kernel.rs"
 
 [[example]]
 
@@ -22,7 +22,7 @@ fn main() {
     let af_ctx = afcl::get_context(false);
     let af_que = afcl::get_queue(false);
 
-    let devid = unsafe { ocl_core::DeviceId::from_raw(af_did) };
+    let _devid = unsafe { ocl_core::DeviceId::from_raw(af_did) };
     let contx = unsafe { ocl_core::Context::from_raw_copied_ptr(af_ctx) };
     let queue = unsafe { ocl_core::CommandQueue::from_raw_copied_ptr(af_que) };
 
 
@@ -518,12 +518,17 @@ where
 }
 
 macro_rules! all_reduce_func_def {
-    ($doc_str: expr, $fn_name: ident, $ffi_name: ident, $out_type:ty) => {
+    ($doc_str: expr, $fn_name: ident, $ffi_name: ident, $assoc_type:ident) => {
         #[doc=$doc_str]
-        pub fn $fn_name<T>(input: &Array<T>) -> ($out_type, $out_type)
+        pub fn $fn_name<T>(input: &Array<T>)
+            -> (
+                <<T as HasAfEnum>::$assoc_type as HasAfEnum>::BaseType,
+                <<T as HasAfEnum>::$assoc_type as HasAfEnum>::BaseType
+               )
         where
             T: HasAfEnum,
-            $out_type: HasAfEnum + Fromf64
+            <T as HasAfEnum>::$assoc_type: HasAfEnum,
+            <<T as HasAfEnum>::$assoc_type as HasAfEnum>::BaseType: HasAfEnum + Fromf64,
         {
             let mut real: f64 = 0.0;
             let mut imag: f64 = 0.0;
@@ -533,7 +538,10 @@ macro_rules! all_reduce_func_def {
                 );
                 HANDLE_ERROR(AfError::from(err_val));
             }
-            (<$out_type>::fromf64(real), <$out_type>::fromf64(imag))
+            (
+                <<T as HasAfEnum>::$assoc_type as HasAfEnum>::BaseType::fromf64(real),
+                <<T as HasAfEnum>::$assoc_type as HasAfEnum>::BaseType::fromf64(imag),
+            )
         }
     };
 }
@@ -564,7 +572,7 @@ all_reduce_func_def!(
     ",
     sum_all,
     af_sum_all,
-    T::AggregateOutType
+    AggregateOutType
 );
 
 all_reduce_func_def!(
@@ -594,7 +602,7 @@ all_reduce_func_def!(
     ",
     product_all,
     af_product_all,
-    T::ProductOutType
+    ProductOutType
 );
 
 all_reduce_func_def!(
@@ -623,7 +631,7 @@ all_reduce_func_def!(
     ",
     min_all,
     af_min_all,
-    T::InType
+    InType
 );
 
 all_reduce_func_def!(
@@ -652,10 +660,31 @@ all_reduce_func_def!(
     ",
     max_all,
     af_max_all,
-    T::InType
+    InType
 );
 
-all_reduce_func_def!(
+// Generates a whole-array reduction function whose output type is a concrete
+// type supplied by the macro caller (`$out_type:ty`, e.g. `bool`), in contrast
+// to `all_reduce_func_def`, which takes the name of an associated type of
+// `HasAfEnum` (`$assoc_type:ident`) and returns that type's `BaseType`.
+//
+// Arguments:
+// - `$doc_str`:  documentation string attached to the generated function.
+// - `$fn_name`:  name of the generated public function.
+// - `$ffi_name`: FFI function called to perform the reduction.
+// - `$out_type`: type of both elements of the returned tuple; it must
+//                implement `HasAfEnum` and `Fromf64`.
+macro_rules! all_reduce_func_def2 {
+    ($doc_str: expr, $fn_name: ident, $ffi_name: ident, $out_type:ty) => {
+        #[doc=$doc_str]
+        pub fn $fn_name<T>(input: &Array<T>) -> ($out_type, $out_type)
+        where
+            T: HasAfEnum,
+            $out_type: HasAfEnum + Fromf64
+        {
+            // The FFI call writes its two results through these out-pointers as f64.
+            let mut real: f64 = 0.0;
+            let mut imag: f64 = 0.0;
+            // NOTE(review): presumably sound because both out-pointers refer to live
+            // locals and `input.get()` yields a valid array handle -- confirm against
+            // the FFI contract of `$ffi_name`.
+            unsafe {
+                let err_val = $ffi_name(
+                    &mut real as *mut c_double, &mut imag as *mut c_double, input.get(),
+                );
+                // The returned status code is converted to `AfError` and handed to
+                // `HANDLE_ERROR`.
+                HANDLE_ERROR(AfError::from(err_val));
+            }
+            // Convert both f64 results into the requested output type.
+            (<$out_type>::fromf64(real), <$out_type>::fromf64(imag))
+        }
+    };
+}
+
+all_reduce_func_def2!(
     "
     Find if all values of Array are non-zero
 
@@ -682,7 +711,7 @@ all_reduce_func_def!(
     bool
 );
 
-all_reduce_func_def!(
+all_reduce_func_def2!(
     "
     Find if any value of Array is non-zero
 
@@ -709,7 +738,7 @@ all_reduce_func_def!(
     bool
 );
 
-all_reduce_func_def!(
+all_reduce_func_def2!(
     "
     Count number of non-zero values in the Array
 
@@ -751,10 +780,17 @@ all_reduce_func_def!(
 /// A tuple of summation result.
 ///
 /// Note: For non-complex data type Arrays, second value of tuple is zero.
-pub fn sum_nan_all<T>(input: &Array<T>, val: f64) -> (T::AggregateOutType, T::AggregateOutType)
+pub fn sum_nan_all<T>(
+    input: &Array<T>,
+    val: f64,
+) -> (
+    <<T as HasAfEnum>::AggregateOutType as HasAfEnum>::BaseType,
+    <<T as HasAfEnum>::AggregateOutType as HasAfEnum>::BaseType,
+)
 where
     T: HasAfEnum,
-    T::AggregateOutType: HasAfEnum + Fromf64,
+    <T as HasAfEnum>::AggregateOutType: HasAfEnum,
+    <<T as HasAfEnum>::AggregateOutType as HasAfEnum>::BaseType: HasAfEnum + Fromf64,
 {
     let mut real: f64 = 0.0;
     let mut imag: f64 = 0.0;
@@ -768,8 +804,8 @@ where
         HANDLE_ERROR(AfError::from(err_val));
     }
     (
-        <T::AggregateOutType>::fromf64(real),
-        <T::AggregateOutType>::fromf64(imag),
+        <<T as HasAfEnum>::AggregateOutType as HasAfEnum>::BaseType::fromf64(real),
+        <<T as HasAfEnum>::AggregateOutType as HasAfEnum>::BaseType::fromf64(imag),
     )
 }
 
@@ -788,10 +824,17 @@ where
 /// A tuple of product result.
 ///
 /// Note: For non-complex data type Arrays, second value of tuple is zero.
-pub fn product_nan_all<T>(input: &Array<T>, val: f64) -> (T::ProductOutType, T::ProductOutType)
+pub fn product_nan_all<T>(
+    input: &Array<T>,
+    val: f64,
+) -> (
+    <<T as HasAfEnum>::ProductOutType as HasAfEnum>::BaseType,
+    <<T as HasAfEnum>::ProductOutType as HasAfEnum>::BaseType,
+)
 where
     T: HasAfEnum,
-    T::ProductOutType: HasAfEnum + Fromf64,
+    <T as HasAfEnum>::ProductOutType: HasAfEnum,
+    <<T as HasAfEnum>::ProductOutType as HasAfEnum>::BaseType: HasAfEnum + Fromf64,
 {
     let mut real: f64 = 0.0;
     let mut imag: f64 = 0.0;
@@ -805,8 +848,8 @@ where
         HANDLE_ERROR(AfError::from(err_val));
     }
     (
-        <T::ProductOutType>::fromf64(real),
-        <T::ProductOutType>::fromf64(imag),
+        <<T as HasAfEnum>::ProductOutType as HasAfEnum>::BaseType::fromf64(real),
+        <<T as HasAfEnum>::ProductOutType as HasAfEnum>::BaseType::fromf64(imag),
     )
 }
 
@@ -858,12 +901,18 @@ dim_ireduce_func_def!("
     ", imax, af_imax, InType);
 
 macro_rules! all_ireduce_func_def {
-    ($doc_str: expr, $fn_name: ident, $ffi_name: ident, $out_type:ty) => {
+    ($doc_str: expr, $fn_name: ident, $ffi_name: ident, $assoc_type:ident) => {
         #[doc=$doc_str]
-        pub fn $fn_name<T>(input: &Array<T>) -> ($out_type, $out_type, u32)
+        pub fn $fn_name<T>(input: &Array<T>)
+            -> (
+                <<T as HasAfEnum>::$assoc_type as HasAfEnum>::BaseType,
+                <<T as HasAfEnum>::$assoc_type as HasAfEnum>::BaseType,
+                u32
+               )
         where
             T: HasAfEnum,
-            $out_type: HasAfEnum + Fromf64
+            <T as HasAfEnum>::$assoc_type: HasAfEnum,
+            <<T as HasAfEnum>::$assoc_type as HasAfEnum>::BaseType: HasAfEnum + Fromf64,
         {
             let mut real: f64 = 0.0;
             let mut imag: f64 = 0.0;
@@ -875,7 +924,11 @@ macro_rules! all_ireduce_func_def {
                 );
                 HANDLE_ERROR(AfError::from(err_val));
             }
-            (<$out_type>::fromf64(real), <$out_type>::fromf64(imag), temp)
+            (
+                <<T as HasAfEnum>::$assoc_type as HasAfEnum>::BaseType::fromf64(real),
+                <<T as HasAfEnum>::$assoc_type as HasAfEnum>::BaseType::fromf64(imag),
+                temp,
+            )
         }
     };
 }
@@ -898,7 +951,7 @@ all_ireduce_func_def!(
     ",
     imin_all,
     af_imin_all,
-    T::InType
+    InType
 );
 all_ireduce_func_def!(
     "
@@ -918,7 +971,7 @@ all_ireduce_func_def!(
     ",
     imax_all,
     af_imax_all,
-    T::InType
+    InType
 );
 
 /// Locate the indices of non-zero elements.
@@ -1386,3 +1439,40 @@ dim_reduce_by_key_nan_func_def!(
     af_product_by_key_nan,
     ValueType::ProductOutType
 );
+
+// Smoke tests for the whole-array reduction API. Each test calls the
+// reductions on arrays of different element types and prints the returned
+// tuples; no assertions are made about the values themselves.
+#[cfg(test)]
+mod tests {
+    use super::super::core::c32;
+    use super::{imax_all, imin_all, product_nan_all, sum_all, sum_nan_all};
+    use crate::randu;
+
+    // Exercises `sum_all`, `product_nan_all` and `sum_nan_all` on a complex
+    // (`c32`) input and a `bool` input.
+    #[test]
+    fn all_reduce_api() {
+        let a = randu!(c32; 10, 10);
+        println!("Reduction of complex f32 matrix: {:?}", sum_all(&a));
+
+        let b = randu!(bool; 10, 10);
+        println!("reduction of bool matrix: {:?}", sum_all(&b));
+
+        println!(
+            "reduction of complex f32 matrix after replacing nan with {}: {:?}",
+            1.0,
+            product_nan_all(&a, 1.0)
+        );
+
+        println!(
+            "reduction of bool matrix after replacing nan with {}: {:?}",
+            0.0,
+            sum_nan_all(&b, 0.0)
+        );
+    }
+
+    // Exercises `imin_all` on a complex (`c32`) input and `imax_all` on a
+    // `u32` input.
+    #[test]
+    fn all_ireduce_api() {
+        let a = randu!(c32; 10);
+        println!("Reduction of complex f32 matrix: {:?}", imin_all(&a));
+
+        // `b` holds `u32` values, so the label says so (it previously said "bool").
+        let b = randu!(u32; 10);
+        println!("reduction of u32 matrix: {:?}", imax_all(&b));
+    }
+}