2014 Eurobot fork
Dependencies: mbed-rtos mbed QEI
tvmet/loop/Gemv.h@92:4a1225fbb146, 2013-10-15 (annotated)
- Committer:
- rsavitski
- Date:
- Tue Oct 15 12:19:32 2013 +0000
- Revision:
- 92:4a1225fbb146
- Parent:
- 15:9c5aaeda36dc
touch: ripped out 2013-specific bits. Need to address "2014" comments. Rewrite AI layer and other deleted parts.
Who changed what in which revision?
User | Revision | Line number | New contents of line |
---|---|---|---|
madcowswe | 15:9c5aaeda36dc | 1 | /* |
madcowswe | 15:9c5aaeda36dc | 2 | * Tiny Vector Matrix Library |
madcowswe | 15:9c5aaeda36dc | 3 | * Dense Vector Matrix Library of Tiny size using Expression Templates |
madcowswe | 15:9c5aaeda36dc | 4 | * |
madcowswe | 15:9c5aaeda36dc | 5 | * Copyright (C) 2001 - 2007 Olaf Petzold <opetzold@users.sourceforge.net> |
madcowswe | 15:9c5aaeda36dc | 6 | * |
madcowswe | 15:9c5aaeda36dc | 7 | * This library is free software; you can redistribute it and/or |
madcowswe | 15:9c5aaeda36dc | 8 | * modify it under the terms of the GNU Lesser General Public |
madcowswe | 15:9c5aaeda36dc | 9 | * License as published by the Free Software Foundation; either |
madcowswe | 15:9c5aaeda36dc | 10 | * version 2.1 of the License, or (at your option) any later version. |
madcowswe | 15:9c5aaeda36dc | 11 | * |
madcowswe | 15:9c5aaeda36dc | 12 | * This library is distributed in the hope that it will be useful, |
madcowswe | 15:9c5aaeda36dc | 13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
madcowswe | 15:9c5aaeda36dc | 14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
madcowswe | 15:9c5aaeda36dc | 15 | * Lesser General Public License for more details. |
madcowswe | 15:9c5aaeda36dc | 16 | * |
madcowswe | 15:9c5aaeda36dc | 17 | * You should have received a copy of the GNU Lesser General Public |
madcowswe | 15:9c5aaeda36dc | 18 | * License along with this library; if not, write to the Free Software |
madcowswe | 15:9c5aaeda36dc | 19 | * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
madcowswe | 15:9c5aaeda36dc | 20 | * |
madcowswe | 15:9c5aaeda36dc | 21 | * $Id: Gemv.h,v 1.7 2007-06-23 15:58:59 opetzold Exp $ |
madcowswe | 15:9c5aaeda36dc | 22 | */ |
madcowswe | 15:9c5aaeda36dc | 23 | |
madcowswe | 15:9c5aaeda36dc | 24 | #ifndef TVMET_LOOP_GEMV_H |
madcowswe | 15:9c5aaeda36dc | 25 | #define TVMET_LOOP_GEMV_H |
madcowswe | 15:9c5aaeda36dc | 26 | |
madcowswe | 15:9c5aaeda36dc | 27 | namespace tvmet { |
madcowswe | 15:9c5aaeda36dc | 28 | |
madcowswe | 15:9c5aaeda36dc | 29 | namespace loop { |
madcowswe | 15:9c5aaeda36dc | 30 | |
madcowswe | 15:9c5aaeda36dc | 31 | |
madcowswe | 15:9c5aaeda36dc | 32 | /** |
madcowswe | 15:9c5aaeda36dc | 33 | * \class gemv Gemv.h "tvmet/loop/Gemv.h" |
madcowswe | 15:9c5aaeda36dc | 34 | * \brief Matrix-vector product, one result element per call, using loop unrolling. |
madcowswe | 15:9c5aaeda36dc | 35 | * prod(lhs, rhs, i) sums lhs(i, j) * rhs(j) over j = 0 .. Cols-1, i.e. element i of |
madcowswe | 15:9c5aaeda36dc | 36 | * \f[ |
madcowswe | 15:9c5aaeda36dc | 37 | * M\,v |
madcowswe | 15:9c5aaeda36dc | 38 | * \f] |
madcowswe | 15:9c5aaeda36dc | 39 | * \par Example: |
madcowswe | 15:9c5aaeda36dc | 40 | * \code |
madcowswe | 15:9c5aaeda36dc | 41 | * template<class T, std::size_t Rows, std::size_t Cols> |
madcowswe | 15:9c5aaeda36dc | 42 | * inline |
madcowswe | 15:9c5aaeda36dc | 43 | * void |
madcowswe | 15:9c5aaeda36dc | 44 | * prod(const Matrix<T, Rows, Cols>& lhs, const Vector<T, Cols>& rhs, |
madcowswe | 15:9c5aaeda36dc | 45 | * Vector<T, Rows>& dest) |
madcowswe | 15:9c5aaeda36dc | 46 | * { |
madcowswe | 15:9c5aaeda36dc | 47 | * for (std::size_t i = 0; i != Rows; ++i) { |
madcowswe | 15:9c5aaeda36dc | 48 | * dest(i) = tvmet::loop::gemv<Rows, Cols>().prod(lhs, rhs, i); |
madcowswe | 15:9c5aaeda36dc | 49 | * } |
madcowswe | 15:9c5aaeda36dc | 50 | * } |
madcowswe | 15:9c5aaeda36dc | 51 | * \endcode |
madcowswe | 15:9c5aaeda36dc | 52 | */ |
madcowswe | 15:9c5aaeda36dc | 53 | template<std::size_t Rows, std::size_t Cols> |
madcowswe | 15:9c5aaeda36dc | 54 | class gemv |
madcowswe | 15:9c5aaeda36dc | 55 | { |
madcowswe | 15:9c5aaeda36dc | 56 | gemv(const gemv&); |
madcowswe | 15:9c5aaeda36dc | 57 | gemv& operator=(const gemv&); |
madcowswe | 15:9c5aaeda36dc | 58 | |
madcowswe | 15:9c5aaeda36dc | 59 | private: |
madcowswe | 15:9c5aaeda36dc | 60 | enum { |
madcowswe | 15:9c5aaeda36dc | 61 | count = Cols, |
madcowswe | 15:9c5aaeda36dc | 62 | N = (count+7)/8 |
madcowswe | 15:9c5aaeda36dc | 63 | }; |
madcowswe | 15:9c5aaeda36dc | 64 | |
madcowswe | 15:9c5aaeda36dc | 65 | public: |
madcowswe | 15:9c5aaeda36dc | 66 | gemv() { } |
madcowswe | 15:9c5aaeda36dc | 67 | |
madcowswe | 15:9c5aaeda36dc | 68 | public: |
madcowswe | 15:9c5aaeda36dc | 69 | template<class E1, class E2> |
madcowswe | 15:9c5aaeda36dc | 70 | static inline |
madcowswe | 15:9c5aaeda36dc | 71 | typename PromoteTraits< |
madcowswe | 15:9c5aaeda36dc | 72 | typename E1::value_type, |
madcowswe | 15:9c5aaeda36dc | 73 | typename E2::value_type |
madcowswe | 15:9c5aaeda36dc | 74 | >::value_type |
madcowswe | 15:9c5aaeda36dc | 75 | prod(const E1& lhs, const E2& rhs, std::size_t i) { |
madcowswe | 15:9c5aaeda36dc | 76 | typename PromoteTraits< |
madcowswe | 15:9c5aaeda36dc | 77 | typename E1::value_type, |
madcowswe | 15:9c5aaeda36dc | 78 | typename E2::value_type |
madcowswe | 15:9c5aaeda36dc | 79 | >::value_type sum(0); |
madcowswe | 15:9c5aaeda36dc | 80 | std::size_t j(0); |
madcowswe | 15:9c5aaeda36dc | 81 | std::size_t n(N); |
madcowswe | 15:9c5aaeda36dc | 82 | |
madcowswe | 15:9c5aaeda36dc | 83 | // Duff's device: the switch jumps into the 8x-unrolled loop at case (count % 8) so the first pass handles the remainder terms; n = N = (count+7)/8 counts the passes. NOTE(review): with Cols == 0, n starts at 0 and --n wraps, so Cols > 0 appears to be assumed -- confirm against callers. |
madcowswe | 15:9c5aaeda36dc | 84 | switch(count % 8) { |
madcowswe | 15:9c5aaeda36dc | 85 | case 0: do { sum += lhs(i, j) * rhs(j); ++j; |
madcowswe | 15:9c5aaeda36dc | 86 | case 7: sum += lhs(i, j) * rhs(j); ++j; |
madcowswe | 15:9c5aaeda36dc | 87 | case 6: sum += lhs(i, j) * rhs(j); ++j; |
madcowswe | 15:9c5aaeda36dc | 88 | case 5: sum += lhs(i, j) * rhs(j); ++j; |
madcowswe | 15:9c5aaeda36dc | 89 | case 4: sum += lhs(i, j) * rhs(j); ++j; |
madcowswe | 15:9c5aaeda36dc | 90 | case 3: sum += lhs(i, j) * rhs(j); ++j; |
madcowswe | 15:9c5aaeda36dc | 91 | case 2: sum += lhs(i, j) * rhs(j); ++j; |
madcowswe | 15:9c5aaeda36dc | 92 | case 1: sum += lhs(i, j) * rhs(j); ++j; |
madcowswe | 15:9c5aaeda36dc | 93 | } while(--n != 0); |
madcowswe | 15:9c5aaeda36dc | 94 | } |
madcowswe | 15:9c5aaeda36dc | 95 | |
madcowswe | 15:9c5aaeda36dc | 96 | return sum; |
madcowswe | 15:9c5aaeda36dc | 97 | } |
madcowswe | 15:9c5aaeda36dc | 98 | }; |
madcowswe | 15:9c5aaeda36dc | 99 | |
madcowswe | 15:9c5aaeda36dc | 100 | |
madcowswe | 15:9c5aaeda36dc | 101 | } // namespace loop |
madcowswe | 15:9c5aaeda36dc | 102 | |
madcowswe | 15:9c5aaeda36dc | 103 | } // namespace tvmet |
madcowswe | 15:9c5aaeda36dc | 104 | |
madcowswe | 15:9c5aaeda36dc | 105 | #endif /* TVMET_LOOP_GEMV_H */ |
madcowswe | 15:9c5aaeda36dc | 106 | |
madcowswe | 15:9c5aaeda36dc | 107 | // Local Variables: |
madcowswe | 15:9c5aaeda36dc | 108 | // mode:C++ |
madcowswe | 15:9c5aaeda36dc | 109 | // tab-width:8 |
madcowswe | 15:9c5aaeda36dc | 110 | // End: |