arrayfire/src/api/c/assign.cpp at v3.8 · feiyunwill/arrayfire

402 lines (356 loc) · 14.7 KB
/*******************************************************
 * Copyright (c) 2014, ArrayFire
 * All rights reserved.
 * This file is distributed under 3-clause BSD license.
 * The complete license agreement can be obtained at:
 * http://arrayfire.com/licenses/BSD-3-Clause
 ********************************************************/
#include <assign.hpp>
#include <Array.hpp>
#include <backend.hpp>
#include <common/ArrayInfo.hpp>
#include <common/complex.hpp>
#include <common/err_common.hpp>
#include <common/half.hpp>
#include <copy.hpp>
#include <handle.hpp>
#include <indexing_common.hpp>
#include <math.hpp>
#include <tile.hpp>
#include <af/data.h>
#include <af/defines.h>
#include <af/dim4.hpp>
#include <af/index.h>
using std::signbit;
using std::swap;
using std::vector;
using af::dim4;
using common::convert2Canonical;
using common::createSpanIndex;
using common::half;
using common::if_complex;
using common::if_real;
using detail::Array;
using detail::cdouble;
using detail::cfloat;
using detail::createSubArray;
using detail::intl;
using detail::uchar;
using detail::uint;
using detail::uintl;
using detail::ushort;
template<typename Tout, typename Tin>
static void assign(Array<Tout>& out, const vector<af_seq> seqs,
                   const Array<Tin>& in) {
    size_t ndims      = seqs.size();
    const dim4& outDs = out.dims();
    const dim4& iDims = in.dims();
    if (iDims.elements() == 0) { return; }
    out.eval();
    dim4 oDims = toDims(seqs, outDs);
    bool isVec = true;
    for (int i = 0; isVec && i < static_cast<int>(oDims.ndims()) - 1; i++) {
        isVec &= oDims[i] == 1;
    isVec &= in.isVector() || in.isScalar();
    for (auto i = static_cast<dim_t>(ndims); i < in.ndims(); i++) {
        oDims[i] = 1;
    if (isVec) {
        if (oDims.elements() != in.elements() && in.elements() != 1) {
            AF_ERROR("Size mismatch between input and output", AF_ERR_SIZE);
        // If both out and in are vectors of equal elements,
        // reshape in to out dims
        Array<Tin> in_ =
            in.elements() == 1 ? tile(in, oDims) : modDims(in, oDims);
        auto dst = createSubArray<Tout>(out, seqs, false);
        copyArray<Tin, Tout>(dst, in_);
    } else {
        for (int i = 0; i < AF_MAX_DIMS; i++) {
            if (oDims[i] != iDims[i]) {
                AF_ERROR("Size mismatch between input and output", AF_ERR_SIZE);
        Array<Tout> dst = createSubArray<Tout>(out, seqs, false);
        copyArray<Tin, Tout>(dst, in);
template<typename T>
static if_complex<T> assign(Array<T>& out, const vector<af_seq> iv,
                            const af_array& in) {
    const ArrayInfo& iInfo = getInfo(in);
    af_dtype iType         = iInfo.getType();
    switch (iType) {
        case c64: assign<T, cdouble>(out, iv, getArray<cdouble>(in)); break;
        case c32: assign<T, cfloat>(out, iv, getArray<cfloat>(in)); break;
        default: TYPE_ERROR(1, iType); break;
template<typename T>
static if_real<T> assign(Array<T>& out, const vector<af_seq> iv,
                         const af_array& in) {
    const ArrayInfo& iInfo = getInfo(in);
    af_dtype iType         = iInfo.getType();
    switch (iType) {
        case f64: assign<T, double>(out, iv, getArray<double>(in)); break;
        case f32: assign<T, float>(out, iv, getArray<float>(in)); break;
        case s32: assign<T, int>(out, iv, getArray<int>(in)); break;
        case u32: assign<T, uint>(out, iv, getArray<uint>(in)); break;
        case s64: assign<T, intl>(out, iv, getArray<intl>(in)); break;
        case u64: assign<T, uintl>(out, iv, getArray<uintl>(in)); break;
        case s16: assign<T, short>(out, iv, getArray<short>(in)); break;
        case u16: assign<T, ushort>(out, iv, getArray<ushort>(in)); break;
        case u8: assign<T, uchar>(out, iv, getArray<uchar>(in)); break;
        case b8: assign<T, char>(out, iv, getArray<char>(in)); break;
        case f16: assign<T, half>(out, iv, getArray<half>(in)); break;
        default: TYPE_ERROR(1, iType); break;
af_err af_assign_seq(af_array* out, const af_array lhs, const unsigned ndims,
                     const af_seq* index, const af_array rhs) {
        ARG_ASSERT(2, (ndims > 0 && ndims <= AF_MAX_DIMS));
        ARG_ASSERT(1, (lhs != 0));
        ARG_ASSERT(4, (rhs != 0));
        const ArrayInfo& lInfo = getInfo(lhs);
        if (ndims == 1 && ndims != lInfo.ndims()) {
            af_array tmp_in;
            af_array tmp_out;
            AF_CHECK(af_flat(&tmp_in, lhs));
            AF_CHECK(af_assign_seq(&tmp_out, tmp_in, ndims, index, rhs));
            AF_CHECK(
                af_moddims(out, tmp_out, lInfo.ndims(), lInfo.dims().get()));
            AF_CHECK(af_release_array(tmp_in));
            // This can run into a double free issue if tmp_in == tmp_out
            // The condition ensures release only if both are different
            // Issue found on Tegra X1
            if (tmp_in != tmp_out) { AF_CHECK(af_release_array(tmp_out)); }
            return AF_SUCCESS;
        af_array res = 0;
        if (*out != lhs) {
            int count = 0;
            AF_CHECK(af_get_data_ref_count(&count, lhs));
            if (count > 1) {
                AF_CHECK(af_copy_array(&res, lhs));
            } else {
                res = retain(lhs);
        } else {
            res = lhs;
        try {
            if (lhs != rhs) {
                const dim4& outDims = getInfo(res).dims();
                const dim4& inDims  = getInfo(rhs).dims();
                vector<af_seq> inSeqs(ndims, af_span);
                for (unsigned i = 0; i < ndims; ++i) {
                    inSeqs[i] = convert2Canonical(index[i], outDims[i]);
                    ARG_ASSERT(3,
                               (inSeqs[i].begin >= 0. || inSeqs[i].end >= 0.));
                    if (signbit(inSeqs[i].step)) {
                        ARG_ASSERT(3, inSeqs[i].begin >= inSeqs[i].end);
                    } else {
                        ARG_ASSERT(3, inSeqs[i].begin <= inSeqs[i].end);
                DIM_ASSERT(0, (outDims.ndims() >= inDims.ndims()));
                DIM_ASSERT(0, (outDims.ndims() >= (dim_t)ndims));
                const ArrayInfo& oInfo = getInfo(res);
                af_dtype oType         = oInfo.getType();
                switch (oType) {
                    case c64:
                        assign(getArray<cdouble>(res), inSeqs, rhs);
                    case c32: assign(getArray<cfloat>(res), inSeqs, rhs); break;
                    case f64: assign(getArray<double>(res), inSeqs, rhs); break;
                    case f32: assign(getArray<float>(res), inSeqs, rhs); break;
                    case s32: assign(getArray<int>(res), inSeqs, rhs); break;
                    case u32: assign(getArray<uint>(res), inSeqs, rhs); break;
                    case s64: assign(getArray<intl>(res), inSeqs, rhs); break;
                    case u64: assign(getArray<uintl>(res), inSeqs, rhs); break;
                    case s16: assign(getArray<short>(res), inSeqs, rhs); break;
                    case u16: assign(getArray<ushort>(res), inSeqs, rhs); break;
                    case u8: assign(getArray<uchar>(res), inSeqs, rhs); break;
                    case b8: assign(getArray<char>(res), inSeqs, rhs); break;
                    case f16: assign(getArray<half>(res), inSeqs, rhs); break;
                    default: TYPE_ERROR(1, oType); break;
        } catch (...) {
            af_release_array(res);
            throw;
        swap(*out, res);
    CATCHALL;
    return AF_SUCCESS;
template<typename T>
inline void genAssign(af_array& out, const af_index_t* indexs,
                      const af_array& rhs) {
    detail::assign<T>(getArray<T>(out), indexs, getArray<T>(rhs));
af_err af_assign_gen(af_array* out, const af_array lhs, const dim_t ndims,
                     const af_index_t* indexs, const af_array rhs_) {
        ARG_ASSERT(2, (ndims > 0 && ndims <= AF_MAX_DIMS));
        ARG_ASSERT(3, (indexs != NULL));
        int track = 0;
        vector<af_seq> seqs(AF_MAX_DIMS, af_span);
        for (dim_t i = 0; i < ndims; i++) {
            if (indexs[i].isSeq) {
                track++;
                seqs[i] = indexs[i].idx.seq;
        af_array rhs = rhs_;
        if (track == static_cast<int>(ndims)) {
            // all indexs are sequences, redirecting to af_assign
            return af_assign_seq(out, lhs, ndims, seqs.data(), rhs);
        ARG_ASSERT(1, (lhs != 0));
        ARG_ASSERT(4, (rhs != 0));
        const ArrayInfo& lInfo = getInfo(lhs);
        const ArrayInfo& rInfo = getInfo(rhs);
        const dim4& lhsDims    = lInfo.dims();
        const dim4& rhsDims    = rInfo.dims();
        af_dtype lhsType       = lInfo.getType();
        af_dtype rhsType       = rInfo.getType();
        if (rhsDims.ndims() == 0) { return af_retain_array(out, lhs); }
        if (lhsDims.ndims() == 0) {
            return af_create_handle(out, 0, nullptr, lhsType);
        ARG_ASSERT(2, (ndims == 1) || (ndims == (dim_t)lInfo.ndims()));
        if (ndims == 1 && ndims != static_cast<dim_t>(lInfo.ndims())) {
            af_array tmp_in  = 0;
            af_array tmp_out = 0;
            AF_CHECK(af_flat(&tmp_in, lhs));
            AF_CHECK(af_assign_gen(&tmp_out, tmp_in, ndims, indexs, rhs_));
            AF_CHECK(
                af_moddims(out, tmp_out, lInfo.ndims(), lInfo.dims().get()));
            AF_CHECK(af_release_array(tmp_in));
            // This can run into a double free issue if tmp_in == tmp_out
            // The condition ensures release only if both are different
            // Issue found on Tegra X1
            if (tmp_in != tmp_out) { AF_CHECK(af_release_array(tmp_out)); }
            return AF_SUCCESS;
        ARG_ASSERT(1, (lhsType == rhsType));
        ARG_ASSERT(1, (lhsDims.ndims() >= rhsDims.ndims()));
        ARG_ASSERT(2, (lhsDims.ndims() >= ndims));
        af_array output = 0;
        if (*out != lhs) {
            int count = 0;
            AF_CHECK(af_get_data_ref_count(&count, lhs));
            if (count > 1) {
                AF_CHECK(af_copy_array(&output, lhs));
            } else {
                output = retain(lhs);
        } else {
            output = lhs;
        dim4 oDims = toDims(seqs, lhsDims);
        // if af_array are indexs along any
        // particular dimension, set the length of
        // that dimension accordingly before any checks
        for (dim_t i = 0; i < ndims; i++) {
            if (!indexs[i].isSeq) {
                oDims[i] = getInfo(indexs[i].idx.arr).elements();
        for (dim_t i = ndims; i < static_cast<dim_t>(lInfo.ndims()); i++) {
            oDims[i] = 1;
        bool isVec = true;
        for (int i = 0; isVec && i < oDims.ndims() - 1; i++) {
            isVec &= oDims[i] == 1;
        // TODO(umar): Move logic out of this
        isVec &= rInfo.isVector() || rInfo.isScalar();
        if (isVec) {
            if (oDims.elements() != static_cast<dim_t>(rInfo.elements()) &&
                rInfo.elements() != 1) {
                AF_ERROR("Size mismatch between input and output", AF_ERR_SIZE);
            if (rInfo.elements() == 1) {
                AF_CHECK(af_tile(&rhs, rhs_, oDims[0], oDims[1], oDims[2],
                                 oDims[3]));
            } else {
                // If both out and rhs are vectors of equal
                // elements, reshape rhs to out dims
                AF_CHECK(af_moddims(&rhs, rhs_, oDims.ndims(), oDims.get()));
        } else {
            for (int i = 0; i < AF_MAX_DIMS; i++) {
                if (oDims[i] != rhsDims[i]) {
                    AF_ERROR("Size mismatch between input and output",
                             AF_ERR_SIZE);
        std::array<af_index_t, AF_MAX_DIMS> idxrs{};
        for (dim_t i = 0; i < AF_MAX_DIMS; ++i) {
            if (i < ndims) {
                bool isSeq = indexs[i].isSeq;
                if (!isSeq) {
                    // check if all af_arrays have atleast one value
                    // to enable indexing along that dimension
                    const ArrayInfo& idxInfo = getInfo(indexs[i].idx.arr);
                    af_dtype idxType         = idxInfo.getType();
                    ARG_ASSERT(3, (idxType != c32));
                    ARG_ASSERT(3, (idxType != c64));
                    ARG_ASSERT(3, (idxType != b8));
                    idxrs[i] = {{indexs[i].idx.arr}, isSeq, indexs[i].isBatch};
                } else {
                    af_seq inSeq =
                        convert2Canonical(indexs[i].idx.seq, lhsDims[i]);
                    ARG_ASSERT(3, (inSeq.begin >= 0 || inSeq.end >= 0));
                    if (signbit(inSeq.step)) {
                        ARG_ASSERT(3, inSeq.begin >= inSeq.end);
                    } else {
                        ARG_ASSERT(3, inSeq.begin <= inSeq.end);
                    idxrs[i].idx.seq = inSeq;
                    idxrs[i].isSeq   = isSeq;
                    idxrs[i].isBatch = indexs[i].isBatch;
            } else {
                // set all dimensions above ndims to spanner
                idxrs[i] = createSpanIndex();
        af_index_t* ptr = idxrs.data();
        try {
            switch (rhsType) {
                case c64: genAssign<cdouble>(output, ptr, rhs); break;
                case f64: genAssign<double>(output, ptr, rhs); break;
                case c32: genAssign<cfloat>(output, ptr, rhs); break;
                case f32: genAssign<float>(output, ptr, rhs); break;
                case u64: genAssign<uintl>(output, ptr, rhs); break;
                case u32: genAssign<uint>(output, ptr, rhs); break;
                case s64: genAssign<intl>(output, ptr, rhs); break;
                case s32: genAssign<int>(output, ptr, rhs); break;
                case s16: genAssign<short>(output, ptr, rhs); break;
                case u16: genAssign<ushort>(output, ptr, rhs); break;
                case u8: genAssign<uchar>(output, ptr, rhs); break;
                case b8: genAssign<char>(output, ptr, rhs); break;
                case f16: genAssign<half>(output, ptr, rhs); break;
                default: TYPE_ERROR(1, rhsType);
        } catch (...) {
            if (*out != lhs) {
                AF_CHECK(af_release_array(output));
                if (isVec) { AF_CHECK(af_release_array(rhs)); }
            throw;
        if (isVec) { AF_CHECK(af_release_array(rhs)); }
        swap(*out, output);
    CATCHALL;
    return AF_SUCCESS;
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

assign.cpp

Latest commit

History

assign.cpp

File metadata and controls