BUGFIX: Add support for broadcasting weights when using mean.

pavanky · pavanky · commit 0a675e87f424 · 2017-09-17T23:46:40.000-07:00
diff --git a/src/api/c/mean.cpp b/src/api/c/mean.cpp
@@ -8,6 +8,7 @@
  ********************************************************/
 
 #include <af/dim4.hpp>
+#include <af/data.h>
 #include <af/statistics.h>
 #include <af/defines.h>
 #include <err_common.hpp>
@@ -91,23 +92,39 @@ af_err af_mean_weighted(af_array *out, const af_array in, const af_array weights
         af_dtype wType  = wInfo.getType();
 
         ARG_ASSERT(2, (wType==f32 || wType==f64)); /* verify that weights are non-complex real numbers */
-        ARG_ASSERT(2, iInfo.dims() == wInfo.dims());
+
+        //FIXME: af_tile creates a temporary tiled weights array; broadcast the weights without this extra copy.
+        af_array w = weights;
+        if (iInfo.dims() != wInfo.dims()) {
+            dim4 iDims = iInfo.dims();
+            dim4 wDims = wInfo.dims();
+            dim4 tDims(1,1,1,1);
+            for (int i = 0; i < 4; i++) {
+                ARG_ASSERT(2, wDims[i] == 1 || wDims[i] == iDims[i]);
+                tDims[i] = iDims[i] / wDims[i];
+            }
+            AF_CHECK(af_tile(&w, weights, tDims[0], tDims[1], tDims[2], tDims[3]));
+        }
 
         switch(iType) {
-            case f64: output = mean< double>(in, weights, dim); break;
-            case f32: output = mean< float >(in, weights, dim); break;
-            case s32: output = mean< float >(in, weights, dim); break;
-            case u32: output = mean< float >(in, weights, dim); break;
-            case s64: output = mean< double>(in, weights, dim); break;
-            case u64: output = mean< double>(in, weights, dim); break;
-            case s16: output = mean< float >(in, weights, dim); break;
-            case u16: output = mean< float >(in, weights, dim); break;
-            case  u8: output = mean< float >(in, weights, dim); break;
-            case  b8: output = mean< float >(in, weights, dim); break;
-            case c32: output = mean< cfloat>(in, weights, dim); break;
-            case c64: output = mean<cdouble>(in, weights, dim); break;
+            case f64: output = mean< double>(in, w, dim); break;
+            case f32: output = mean< float >(in, w, dim); break;
+            case s32: output = mean< float >(in, w, dim); break;
+            case u32: output = mean< float >(in, w, dim); break;
+            case s64: output = mean< double>(in, w, dim); break;
+            case u64: output = mean< double>(in, w, dim); break;
+            case s16: output = mean< float >(in, w, dim); break;
+            case u16: output = mean< float >(in, w, dim); break;
+            case  u8: output = mean< float >(in, w, dim); break;
+            case  b8: output = mean< float >(in, w, dim); break;
+            case c32: output = mean< cfloat>(in, w, dim); break;
+            case c64: output = mean<cdouble>(in, w, dim); break;
             default : TYPE_ERROR(1, iType);
         }
+
+        if (w != weights) {
+            AF_CHECK(af_release_array(w));
+        }
         std::swap(*out, output);
     }
     CATCHALL;
diff --git a/test/mean.cpp b/test/mean.cpp
@@ -301,3 +301,23 @@ TYPED_TEST(WeightedMean, Basic)
 {
     weightedMeanAllTest<TypeParam, float>(af::dim4(32, 30, 33, 17));
 }
+
+// Weights shaped (4096, 1) must be broadcast across all 32 columns of `a`.
+TEST(WeightedMean, Broadcast)
+{
+    const float val = 0.5f;
+    af::array a = af::randu(4096, 32);
+    // One weight per row only, so w.dims() != a.dims() and tiling is required.
+    af::array w = af::constant(val, a.dims(0));
+    af::array c = af::mean(a);
+    af::array d = af::mean(a, w);
+    std::vector<float> hc(c.elements());
+    std::vector<float> hd(d.elements());
+    ASSERT_EQ(hc.size(), hd.size());
+    c.host(hc.data());
+    d.host(hd.data());
+    for (size_t i = 0; i < hc.size(); i++) {
+        // Equal weights cancel: the weighted mean is normalized by their sum.
+        ASSERT_NEAR(hc[i], hd[i], 1E-5);
+    }
+}