123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171 |
- // (c) Daniel Llorens - 2011-2014, 2016-2017
- // This library is free software; you can redistribute it and/or modify it under
- // the terms of the GNU Lesser General Public License as published by the Free
- // Software Foundation; either version 3 of the License, or (at your option) any
- // later version.
- /// @file expr.H
- /// @brief Operator nodes for expression templates.
- #pragma once
- #include "ra/ply.H"
- #ifdef RA_CHECK_BOUNDS
- #define RA_CHECK_BOUNDS_RA_EXPR RA_CHECK_BOUNDS
- #else
- #ifndef RA_CHECK_BOUNDS_RA_EXPR
- #define RA_CHECK_BOUNDS_RA_EXPR 1
- #endif
- #endif
- #if RA_CHECK_BOUNDS_RA_EXPR==0
- #define CHECK_BOUNDS( cond )
- #else
- #define CHECK_BOUNDS( cond ) assert( cond )
- #endif
- namespace ra {
- // Manipulate ET through flat (raw pointer-like) iterators P ...
- template <class Op, class T, class I=std::make_integer_sequence<int, mp::len<T>>>
- struct Flat;
- template <class Op, class ... P, int ... I>
- struct Flat<Op, std::tuple<P ...>, std::integer_sequence<int, I ...>>
- {
- Op & op;
- std::tuple<P ...> t;
- template <class S> void operator+=(S const & s) { ((std::get<I>(t) += std::get<I>(s)), ...); }
- decltype(auto) operator*() { return op(*std::get<I>(t) ...); } // TODO std::apply(op, t)
- };
- template <class Op, class ... P> inline constexpr
- auto flat(Op & op, P && ... p)
- {
- return Flat<Op, std::tuple<P ...>> { op, std::tuple<P ...> { std::forward<P>(p) ... } };
- }
- // forward decl in atom.H
- // TODO others:
- // * 'static': Like expr, but the operator is compile time (e.g. ::apply()).
- // * 'dynamic': Like expr, but driver is selected at run time (e.g. if args are RANK_ANY).
- template <class Op, class ... P, int ... I>
- struct Expr<Op, std::tuple<P ...>, std::integer_sequence<int, I ...>>
- {
- // A-th argument decides rank and shape.
- constexpr static int A = largest_rank<P ...>::value;
- using PA = std::decay_t<mp::Ref_<std::tuple<P ...>, A>>;
- using NotA = mp::ComplementList_<mp::int_list<A>, std::tuple<mp::int_t<I> ...>>;
- Op op;
- std::tuple<P ...> t;
- // If driver is RANK_ANY, driver selection should wait to run time, unless we can tell that RANK_ANY would be selected anyway.
- constexpr static bool VALID_DRIVER = PA::size_s()!=DIM_BAD ; //&& (PA::rank_s()!=RANK_ANY || sizeof...(P)==1);
- template <int iarg>
- std::enable_if_t<(iarg==mp::len<NotA>), bool>
- check(int const driver_rank) const { return true; }
- template <int iarg>
- std::enable_if_t<(iarg<mp::len<NotA>), bool>
- check(int const driver_rank) const
- {
- rank_t ranki = std::get<mp::Ref_<NotA, iarg>::value>(t).rank();
- // Provide safety where RANK_ANY was selected as driver in a leap of faith. TODO Dynamic driver selection.
- assert(ranki<=driver_rank && "driver not max rank (could be RANK_ANY)");
- for (int k=0; k!=ranki; ++k) {
- dim_t sk0 = std::get<A>(t).size(k);
- if (sk0!=DIM_BAD) { // may be == in subexpressions
- dim_t sk = std::get<mp::Ref_<NotA, iarg>::value>(t).size(k);
- assert((sk==sk0 || sk==DIM_BAD) && "mismatched dimensions");
- }
- }
- return check<iarg+1>(driver_rank);
- }
- // see test-compatibility.C [a1] for forward() here.
- constexpr Expr(Op op_, P ... p_): op(std::forward<Op>(op_)), t(std::forward<P>(p_) ...)
- {
- // TODO Try to static_assert. E.g., size_s() vs size_s() can static_assert if we try real3==real2.
- // TODO Should check only the driver: do this on ply.
- CHECK_BOUNDS(check<0>(rank()));
- }
- template <class J>
- constexpr decltype(auto) at(J const & i)
- {
- return op(std::get<I>(t).at(i) ...);
- }
- constexpr void adv(rank_t k, dim_t d)
- {
- (std::get<I>(t).adv(k, d), ...);
- }
- constexpr bool keep_stride(dim_t step, int z, int j) const
- {
- return (std::get<I>(t).keep_stride(step, z, j) && ...);
- }
- constexpr auto stride(int i) const
- {
- return std::make_tuple(std::get<I>(t).stride(i) ...);
- }
- constexpr decltype(auto) flat()
- {
- return ra::flat(op, std::get<I>(t).flat() ...);
- }
- constexpr decltype(auto) flat() const { return flat(); }
- // there's one size (by A), but each arg has its own strides.
- // Note: do not require driver. This is needed by check for all leaves.
- constexpr dim_t size(int i) const { return std::get<A>(t).size(i); }
- constexpr static dim_t size_s() { return PA::size_s(); }
- constexpr static dim_t size_s(int i) { return PA::size_s(i); }
- constexpr rank_t rank() const { return std::get<A>(t).rank(); }
- constexpr static rank_t rank_s() { return PA::rank_s(); }
- constexpr decltype(auto) shape() const
- {
- static_assert(VALID_DRIVER, "can't drive this xpr");
- return std::get<A>(t).shape();
- }
- // needed for xpr with rank_s()==RANK_ANY, which don't decay to scalar when used as operator arguments.
- operator decltype(*(ra::flat(op, std::get<I>(t).flat() ...)))()
- {
- static_assert(rank_s()==0 || rank_s()==RANK_ANY || (rank_s()==1 && size_s()==1), // for coord types
- "bad rank in conversion to scalar");
- assert(rank()==0 || (rank_s()==1 && size_s()==1)); // for coord types; so fixed only
- return *flat();
- }
- // forward to make sure value y is not misused as ref. Cf. test-ra-8.C
- #define DEF_ASSIGNOPS(OP) template <class X> void operator OP(X && x) \
- { for_each([](auto && y, auto && x) { std::forward<decltype(y)>(y) OP x; }, *this, x); }
- FOR_EACH(DEF_ASSIGNOPS, =, *=, +=, -=, /=)
- #undef DEF_ASSIGNOPS
- };
- template <class Op, class ... P> inline constexpr auto
- expr(Op && op, P && ... p)
- {
- return Expr<Op, std::tuple<P ...>> { std::forward<Op>(op), std::forward<P>(p) ... };
- }
- // Wrappers over expr & ply.
- template <class F, class ... A> inline constexpr auto
- map(F && f, A && ... a)
- {
- return expr(std::forward<F>(f), start(std::forward<A>(a)) ...);
- }
- template <class F, class ... A> inline constexpr void
- for_each(F && f, A && ... a)
- {
- ply(expr(std::forward<F>(f), start(std::forward<A>(a)) ...));
- }
- } // namespace ra
- #undef CHECK_BOUNDS
- #undef RA_CHECK_BOUNDS_RA_EXPR
|