MP3 Player without external hardware: a software-based MP3 player built on a modified version of libmad. Output is mono (at the moment) via AnalogOut. Files are read from a USB drive. This is a demo program; it plays only one file at the moment. Documentation is in "main.cpp" and "config.h".
fixed.h@1:7c923cbe9f1d, 2010-11-26 (annotated)
- Committer:
- Gruenfrosch
- Date:
- Fri Nov 26 13:05:34 2010 +0000
- Revision:
- 1:7c923cbe9f1d
- Parent:
- 0:7627c79db971
Fixed the last warning
Who changed what in which revision?
User | Revision | Line number | New contents of line |
---|---|---|---|
Gruenfrosch | 0:7627c79db971 | 1 | /* |
Gruenfrosch | 0:7627c79db971 | 2 | * libmad - MPEG audio decoder library |
Gruenfrosch | 0:7627c79db971 | 3 | * Copyright (C) 2000-2004 Underbit Technologies, Inc. |
Gruenfrosch | 0:7627c79db971 | 4 | * |
Gruenfrosch | 0:7627c79db971 | 5 | * This program is free software; you can redistribute it and/or modify |
Gruenfrosch | 0:7627c79db971 | 6 | * it under the terms of the GNU General Public License as published by |
Gruenfrosch | 0:7627c79db971 | 7 | * the Free Software Foundation; either version 2 of the License, or |
Gruenfrosch | 0:7627c79db971 | 8 | * (at your option) any later version. |
Gruenfrosch | 0:7627c79db971 | 9 | * |
Gruenfrosch | 0:7627c79db971 | 10 | * This program is distributed in the hope that it will be useful, |
Gruenfrosch | 0:7627c79db971 | 11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
Gruenfrosch | 0:7627c79db971 | 12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
Gruenfrosch | 0:7627c79db971 | 13 | * GNU General Public License for more details. |
Gruenfrosch | 0:7627c79db971 | 14 | * |
Gruenfrosch | 0:7627c79db971 | 15 | * You should have received a copy of the GNU General Public License |
Gruenfrosch | 0:7627c79db971 | 16 | * along with this program; if not, write to the Free Software |
Gruenfrosch | 0:7627c79db971 | 17 | * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
Gruenfrosch | 0:7627c79db971 | 18 | * |
Gruenfrosch | 0:7627c79db971 | 19 | * $Id: fixed.h,v 1.1 2010/11/23 20:12:57 andy Exp $ |
Gruenfrosch | 0:7627c79db971 | 20 | */ |
Gruenfrosch | 0:7627c79db971 | 21 | |
Gruenfrosch | 0:7627c79db971 | 22 | # ifndef LIBMAD_FIXED_H |
Gruenfrosch | 0:7627c79db971 | 23 | # define LIBMAD_FIXED_H |
Gruenfrosch | 0:7627c79db971 | 24 | |
Gruenfrosch | 0:7627c79db971 | 25 | #include "config.h" |
Gruenfrosch | 0:7627c79db971 | 26 | /* Base fixed-point integer types: plain int when SIZEOF_INT (presumably supplied by config.h) is >= 4, otherwise long. mad_fixed64hi_t and mad_fixed64lo_t are the signed high and unsigned low halves that the (hi, lo) macro pairs further down operate on. */ |
Gruenfrosch | 0:7627c79db971 | 27 | # if SIZEOF_INT >= 4 |
Gruenfrosch | 0:7627c79db971 | 28 | typedef signed int mad_fixed_t; |
Gruenfrosch | 0:7627c79db971 | 29 | |
Gruenfrosch | 0:7627c79db971 | 30 | typedef signed int mad_fixed64hi_t; |
Gruenfrosch | 0:7627c79db971 | 31 | typedef unsigned int mad_fixed64lo_t; |
Gruenfrosch | 0:7627c79db971 | 32 | # else |
Gruenfrosch | 0:7627c79db971 | 33 | typedef signed long mad_fixed_t; |
Gruenfrosch | 0:7627c79db971 | 34 | |
Gruenfrosch | 0:7627c79db971 | 35 | typedef signed long mad_fixed64hi_t; |
Gruenfrosch | 0:7627c79db971 | 36 | typedef unsigned long mad_fixed64lo_t; |
Gruenfrosch | 0:7627c79db971 | 37 | # endif |
Gruenfrosch | 0:7627c79db971 | 38 | /* 64-bit signed type: __int64 under MSVC, long long everywhere else. The "1 ||" makes the second branch unconditional, so the __GNUC__ test is effectively disabled. This is a macro, not a typedef, so it is only expanded where it is used. */ |
Gruenfrosch | 0:7627c79db971 | 39 | # if defined(_MSC_VER) |
Gruenfrosch | 0:7627c79db971 | 40 | # define mad_fixed64_t signed __int64 |
Gruenfrosch | 0:7627c79db971 | 41 | # elif 1 || defined(__GNUC__) |
Gruenfrosch | 0:7627c79db971 | 42 | # define mad_fixed64_t signed long long |
Gruenfrosch | 0:7627c79db971 | 43 | # endif |
Gruenfrosch | 0:7627c79db971 | 44 | |
Gruenfrosch | 0:7627c79db971 | 45 | # if defined(FPM_FLOAT) |
Gruenfrosch | 0:7627c79db971 | 46 | typedef double mad_sample_t; |
Gruenfrosch | 0:7627c79db971 | 47 | # else |
Gruenfrosch | 0:7627c79db971 | 48 | typedef mad_fixed_t mad_sample_t; |
Gruenfrosch | 0:7627c79db971 | 49 | # endif |
Gruenfrosch | 0:7627c79db971 | 50 | |
Gruenfrosch | 0:7627c79db971 | 51 | /* |
Gruenfrosch | 0:7627c79db971 | 52 | * Fixed-point format: 0xABBBBBBB |
Gruenfrosch | 0:7627c79db971 | 53 | * A == whole part (sign + 3 bits) |
Gruenfrosch | 0:7627c79db971 | 54 | * B == fractional part (28 bits) |
Gruenfrosch | 0:7627c79db971 | 55 | * |
Gruenfrosch | 0:7627c79db971 | 56 | * Values are signed two's complement, so the effective range is: |
Gruenfrosch | 0:7627c79db971 | 57 | * 0x80000000 to 0x7fffffff |
Gruenfrosch | 0:7627c79db971 | 58 | * -8.0 to +7.9999999962747097015380859375 |
Gruenfrosch | 0:7627c79db971 | 59 | * |
Gruenfrosch | 0:7627c79db971 | 60 | * The smallest positive representable value (i.e. the resolution) is: |
Gruenfrosch | 0:7627c79db971 | 61 | * 0x00000001 == 0.0000000037252902984619140625 (i.e. about 3.725e-9) |
Gruenfrosch | 0:7627c79db971 | 62 | * |
Gruenfrosch | 0:7627c79db971 | 63 | * 28 bits of fractional accuracy represent about |
Gruenfrosch | 0:7627c79db971 | 64 | * 8.4 digits of decimal accuracy (28 * log10(2) is roughly 8.43). |
Gruenfrosch | 0:7627c79db971 | 65 | * |
Gruenfrosch | 0:7627c79db971 | 66 | * Fixed-point numbers can be added or subtracted as normal |
Gruenfrosch | 0:7627c79db971 | 67 | * integers, but multiplication requires shifting the 64-bit result |
Gruenfrosch | 0:7627c79db971 | 68 | * from 56 fractional bits back to 28 (and rounding.) |
Gruenfrosch | 0:7627c79db971 | 69 | * |
Gruenfrosch | 0:7627c79db971 | 70 | * Changing the definition of MAD_F_FRACBITS is only partially |
Gruenfrosch | 0:7627c79db971 | 71 | * supported, and must be done with care. |
Gruenfrosch | 0:7627c79db971 | 72 | */ |
Gruenfrosch | 0:7627c79db971 | 73 | |
Gruenfrosch | 0:7627c79db971 | 74 | # define MAD_F_FRACBITS 28 |
Gruenfrosch | 0:7627c79db971 | 75 | |
Gruenfrosch | 0:7627c79db971 | 76 | # if MAD_F_FRACBITS == 28 |
Gruenfrosch | 0:7627c79db971 | 77 | # define MAD_F(x) ((mad_fixed_t) (x##L)) |
Gruenfrosch | 0:7627c79db971 | 78 | # else |
Gruenfrosch | 0:7627c79db971 | 79 | # if MAD_F_FRACBITS < 28 |
Gruenfrosch | 0:7627c79db971 | 80 | # warning "MAD_F_FRACBITS < 28" |
Gruenfrosch | 0:7627c79db971 | 81 | # define MAD_F(x) ((mad_fixed_t) \ |
Gruenfrosch | 0:7627c79db971 | 82 | (((x##L) + \ |
Gruenfrosch | 0:7627c79db971 | 83 | (1L << (28 - MAD_F_FRACBITS - 1))) >> \ |
Gruenfrosch | 0:7627c79db971 | 84 | (28 - MAD_F_FRACBITS))) |
Gruenfrosch | 0:7627c79db971 | 85 | # elif MAD_F_FRACBITS > 28 |
Gruenfrosch | 0:7627c79db971 | 86 | # error "MAD_F_FRACBITS > 28 not currently supported" |
Gruenfrosch | 0:7627c79db971 | 87 | # define MAD_F(x) ((mad_fixed_t) \ |
Gruenfrosch | 0:7627c79db971 | 88 | ((x##L) << (MAD_F_FRACBITS - 28))) |
Gruenfrosch | 0:7627c79db971 | 89 | # endif |
Gruenfrosch | 0:7627c79db971 | 90 | # endif |
Gruenfrosch | 0:7627c79db971 | 91 | /* Range limits of mad_fixed_t. MAD_F_MIN is spelled (-0x7fffffffL - 1) because 0x80000000L has an unsigned type when long is 32 bits wide, so converting its negation back to mad_fixed_t would be implementation-defined. The value is unchanged. */ |
Gruenfrosch | 0:7627c79db971 | 92 | # define MAD_F_MIN ((mad_fixed_t) (-0x7fffffffL - 1)) |
Gruenfrosch | 0:7627c79db971 | 93 | # define MAD_F_MAX ((mad_fixed_t) +0x7fffffffL) |
Gruenfrosch | 0:7627c79db971 | 94 | |
Gruenfrosch | 0:7627c79db971 | 95 | # define MAD_F_ONE MAD_F(0x10000000) |
Gruenfrosch | 0:7627c79db971 | 96 | /* Convert a floating-point value to fixed-point, rounding half away from zero. A bare "+ 0.5" followed by the truncating cast rounded negative inputs toward zero (e.g. -1.0 came out one LSB short). Note that x is evaluated twice. */ |
Gruenfrosch | 0:7627c79db971 | 97 | # define mad_f_tofixed(x) ((mad_fixed_t) \ |
Gruenfrosch | 0:7627c79db971 | 98 | ((x) * (double) (1L << MAD_F_FRACBITS) + ((x) < 0 ? -0.5 : 0.5))) |
Gruenfrosch | 0:7627c79db971 | 99 | # define mad_f_todouble(x) ((double) \ |
Gruenfrosch | 0:7627c79db971 | 100 | ((x) / (double) (1L << MAD_F_FRACBITS))) |
Gruenfrosch | 0:7627c79db971 | 101 | |
Gruenfrosch | 0:7627c79db971 | 102 | # define mad_f_intpart(x) ((x) >> MAD_F_FRACBITS) |
Gruenfrosch | 0:7627c79db971 | 103 | # define mad_f_fracpart(x) ((x) & ((1L << MAD_F_FRACBITS) - 1)) |
Gruenfrosch | 0:7627c79db971 | 104 | /* (x should be positive) */ |
Gruenfrosch | 0:7627c79db971 | 105 | |
Gruenfrosch | 0:7627c79db971 | 106 | # define mad_f_fromint(x) ((x) << MAD_F_FRACBITS) |
Gruenfrosch | 0:7627c79db971 | 107 | |
Gruenfrosch | 0:7627c79db971 | 108 | # define mad_f_add(x, y) ((x) + (y)) |
Gruenfrosch | 0:7627c79db971 | 109 | # define mad_f_sub(x, y) ((x) - (y)) |
Gruenfrosch | 0:7627c79db971 | 110 | |
Gruenfrosch | 0:7627c79db971 | 111 | # if defined(FPM_FLOAT) |
Gruenfrosch | 0:7627c79db971 | 112 | # error "FPM_FLOAT not yet supported" |
Gruenfrosch | 0:7627c79db971 | 113 | |
Gruenfrosch | 0:7627c79db971 | 114 | # undef MAD_F |
Gruenfrosch | 0:7627c79db971 | 115 | # define MAD_F(x) mad_f_todouble(x) |
Gruenfrosch | 0:7627c79db971 | 116 | |
Gruenfrosch | 0:7627c79db971 | 117 | # define mad_f_mul(x, y) ((x) * (y)) |
Gruenfrosch | 0:7627c79db971 | 118 | # define mad_f_scale64 |
Gruenfrosch | 0:7627c79db971 | 119 | |
Gruenfrosch | 0:7627c79db971 | 120 | # undef ASO_ZEROCHECK |
Gruenfrosch | 0:7627c79db971 | 121 | |
Gruenfrosch | 0:7627c79db971 | 122 | # elif defined(FPM_64BIT) |
Gruenfrosch | 0:7627c79db971 | 123 | |
Gruenfrosch | 0:7627c79db971 | 124 | /* |
Gruenfrosch | 0:7627c79db971 | 125 | * This version should be the most accurate if 64-bit types are supported by |
Gruenfrosch | 0:7627c79db971 | 126 | * the compiler, although it may not be the most efficient. |
Gruenfrosch | 0:7627c79db971 | 127 | */ |
Gruenfrosch | 0:7627c79db971 | 128 | # if defined(OPT_ACCURACY) |
Gruenfrosch | 0:7627c79db971 | 129 | # define mad_f_mul(x, y) \ |
Gruenfrosch | 0:7627c79db971 | 130 | ((mad_fixed_t) \ |
Gruenfrosch | 0:7627c79db971 | 131 | ((((mad_fixed64_t) (x) * (y)) + \ |
Gruenfrosch | 0:7627c79db971 | 132 | (1L << (MAD_F_SCALEBITS - 1))) >> MAD_F_SCALEBITS)) |
Gruenfrosch | 0:7627c79db971 | 133 | # else |
Gruenfrosch | 0:7627c79db971 | 134 | # define mad_f_mul(x, y) \ |
Gruenfrosch | 0:7627c79db971 | 135 | ((mad_fixed_t) (((mad_fixed64_t) (x) * (y)) >> MAD_F_SCALEBITS)) |
Gruenfrosch | 0:7627c79db971 | 136 | # endif |
Gruenfrosch | 0:7627c79db971 | 137 | /* Defined after the mad_f_mul() variants that mention it; this is fine because a macro body is only expanded where mad_f_mul() is actually used. */ |
Gruenfrosch | 0:7627c79db971 | 138 | # define MAD_F_SCALEBITS MAD_F_FRACBITS |
Gruenfrosch | 0:7627c79db971 | 139 | |
Gruenfrosch | 0:7627c79db971 | 140 | /* --- Intel --------------------------------------------------------------- */ |
Gruenfrosch | 0:7627c79db971 | 141 | |
Gruenfrosch | 0:7627c79db971 | 142 | # elif defined(FPM_INTEL) |
Gruenfrosch | 0:7627c79db971 | 143 | |
Gruenfrosch | 0:7627c79db971 | 144 | # if defined(_MSC_VER) |
Gruenfrosch | 0:7627c79db971 | 145 | # pragma warning(push) |
Gruenfrosch | 0:7627c79db971 | 146 | # pragma warning(disable: 4035) /* no return value */ |
Gruenfrosch | 0:7627c79db971 | 147 | static __forceinline |
Gruenfrosch | 0:7627c79db971 | 148 | mad_fixed_t mad_f_mul_inline(mad_fixed_t x, mad_fixed_t y) |
Gruenfrosch | 0:7627c79db971 | 149 | { |
Gruenfrosch | 0:7627c79db971 | 150 | enum { |
Gruenfrosch | 0:7627c79db971 | 151 | fracbits = MAD_F_FRACBITS |
Gruenfrosch | 0:7627c79db971 | 152 | }; |
Gruenfrosch | 0:7627c79db971 | 153 | |
Gruenfrosch | 0:7627c79db971 | 154 | __asm { |
Gruenfrosch | 0:7627c79db971 | 155 | mov eax, x |
Gruenfrosch | 0:7627c79db971 | 156 | imul y |
Gruenfrosch | 0:7627c79db971 | 157 | shrd eax, edx, fracbits |
Gruenfrosch | 0:7627c79db971 | 158 | } |
Gruenfrosch | 0:7627c79db971 | 159 | |
Gruenfrosch | 0:7627c79db971 | 160 | /* implicit return of eax */ |
Gruenfrosch | 0:7627c79db971 | 161 | } |
Gruenfrosch | 0:7627c79db971 | 162 | # pragma warning(pop) |
Gruenfrosch | 0:7627c79db971 | 163 | |
Gruenfrosch | 0:7627c79db971 | 164 | # define mad_f_mul mad_f_mul_inline |
Gruenfrosch | 0:7627c79db971 | 165 | # define mad_f_scale64 |
Gruenfrosch | 0:7627c79db971 | 166 | # else |
Gruenfrosch | 0:7627c79db971 | 167 | /* |
Gruenfrosch | 0:7627c79db971 | 168 | * This Intel version is fast and accurate; the disposition of the least |
Gruenfrosch | 0:7627c79db971 | 169 | * significant bit depends on OPT_ACCURACY via mad_f_scale64(). |
Gruenfrosch | 0:7627c79db971 | 170 | */ |
Gruenfrosch | 0:7627c79db971 | 171 | # define MAD_F_MLX(hi, lo, x, y) \ |
Gruenfrosch | 0:7627c79db971 | 172 | asm ("imull %3" \ |
Gruenfrosch | 0:7627c79db971 | 173 | : "=a" (lo), "=d" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 174 | : "%a" (x), "rm" (y) \ |
Gruenfrosch | 0:7627c79db971 | 175 | : "cc") |
Gruenfrosch | 0:7627c79db971 | 176 | |
Gruenfrosch | 0:7627c79db971 | 177 | # if defined(OPT_ACCURACY) |
Gruenfrosch | 0:7627c79db971 | 178 | /* |
Gruenfrosch | 0:7627c79db971 | 179 | * This gives best accuracy but is not very fast. |
Gruenfrosch | 0:7627c79db971 | 180 | */ |
Gruenfrosch | 0:7627c79db971 | 181 | # define MAD_F_MLA(hi, lo, x, y) \ |
Gruenfrosch | 0:7627c79db971 | 182 | ({ mad_fixed64hi_t __hi; \ |
Gruenfrosch | 0:7627c79db971 | 183 | mad_fixed64lo_t __lo; \ |
Gruenfrosch | 0:7627c79db971 | 184 | MAD_F_MLX(__hi, __lo, (x), (y)); \ |
Gruenfrosch | 0:7627c79db971 | 185 | asm ("addl %2,%0\n\t" \ |
Gruenfrosch | 0:7627c79db971 | 186 | "adcl %3,%1" \ |
Gruenfrosch | 0:7627c79db971 | 187 | : "=rm" (lo), "=rm" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 188 | : "r" (__lo), "r" (__hi), "0" (lo), "1" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 189 | : "cc"); \ |
Gruenfrosch | 0:7627c79db971 | 190 | }) |
Gruenfrosch | 0:7627c79db971 | 191 | # endif /* OPT_ACCURACY */ |
Gruenfrosch | 0:7627c79db971 | 192 | |
Gruenfrosch | 0:7627c79db971 | 193 | # if defined(OPT_ACCURACY) |
Gruenfrosch | 0:7627c79db971 | 194 | /* |
Gruenfrosch | 0:7627c79db971 | 195 | * Surprisingly, this is faster than SHRD followed by ADC. |
Gruenfrosch | 0:7627c79db971 | 196 | */ |
Gruenfrosch | 0:7627c79db971 | 197 | # define mad_f_scale64(hi, lo) \ |
Gruenfrosch | 0:7627c79db971 | 198 | ({ mad_fixed64hi_t __hi_; \ |
Gruenfrosch | 0:7627c79db971 | 199 | mad_fixed64lo_t __lo_; \ |
Gruenfrosch | 0:7627c79db971 | 200 | mad_fixed_t __result; \ |
Gruenfrosch | 0:7627c79db971 | 201 | asm ("addl %4,%2\n\t" \ |
Gruenfrosch | 0:7627c79db971 | 202 | "adcl %5,%3" \ |
Gruenfrosch | 0:7627c79db971 | 203 | : "=rm" (__lo_), "=rm" (__hi_) \ |
Gruenfrosch | 0:7627c79db971 | 204 | : "0" (lo), "1" (hi), \ |
Gruenfrosch | 0:7627c79db971 | 205 | "ir" (1L << (MAD_F_SCALEBITS - 1)), "ir" (0) \ |
Gruenfrosch | 0:7627c79db971 | 206 | : "cc"); \ |
Gruenfrosch | 0:7627c79db971 | 207 | asm ("shrdl %3,%2,%1" \ |
Gruenfrosch | 0:7627c79db971 | 208 | : "=rm" (__result) \ |
Gruenfrosch | 0:7627c79db971 | 209 | : "0" (__lo_), "r" (__hi_), "I" (MAD_F_SCALEBITS) \ |
Gruenfrosch | 0:7627c79db971 | 210 | : "cc"); \ |
Gruenfrosch | 0:7627c79db971 | 211 | __result; \ |
Gruenfrosch | 0:7627c79db971 | 212 | }) |
Gruenfrosch | 0:7627c79db971 | 213 | # elif defined(OPT_INTEL) |
Gruenfrosch | 0:7627c79db971 | 214 | /* |
Gruenfrosch | 0:7627c79db971 | 215 | * Alternate Intel scaling that may or may not perform better. hi is first copied into a local bound as a read-write ("+r") operand, because the shll modifies it and GCC requires that input-only asm operands are left unchanged. |
Gruenfrosch | 0:7627c79db971 | 216 | */ |
Gruenfrosch | 0:7627c79db971 | 217 | # define mad_f_scale64(hi, lo) \ |
Gruenfrosch | 0:7627c79db971 | 218 | ({ mad_fixed_t __result; mad_fixed64hi_t __hi_ = (hi); \ |
Gruenfrosch | 0:7627c79db971 | 219 | asm ("shrl %3,%0\n\t" \ |
Gruenfrosch | 0:7627c79db971 | 220 | "shll %4,%1\n\t" \ |
Gruenfrosch | 0:7627c79db971 | 221 | "orl %1,%0" \ |
Gruenfrosch | 0:7627c79db971 | 222 | : "=rm" (__result), "+r" (__hi_) \ |
Gruenfrosch | 0:7627c79db971 | 223 | : "0" (lo), \ |
Gruenfrosch | 0:7627c79db971 | 224 | "I" (MAD_F_SCALEBITS), "I" (32 - MAD_F_SCALEBITS) \ |
Gruenfrosch | 0:7627c79db971 | 225 | : "cc"); \ |
Gruenfrosch | 0:7627c79db971 | 226 | __result; \ |
Gruenfrosch | 0:7627c79db971 | 227 | }) |
Gruenfrosch | 0:7627c79db971 | 228 | # else |
Gruenfrosch | 0:7627c79db971 | 229 | # define mad_f_scale64(hi, lo) \ |
Gruenfrosch | 0:7627c79db971 | 230 | ({ mad_fixed_t __result; \ |
Gruenfrosch | 0:7627c79db971 | 231 | asm ("shrdl %3,%2,%1" \ |
Gruenfrosch | 0:7627c79db971 | 232 | : "=rm" (__result) \ |
Gruenfrosch | 0:7627c79db971 | 233 | : "0" (lo), "r" (hi), "I" (MAD_F_SCALEBITS) \ |
Gruenfrosch | 0:7627c79db971 | 234 | : "cc"); \ |
Gruenfrosch | 0:7627c79db971 | 235 | __result; \ |
Gruenfrosch | 0:7627c79db971 | 236 | }) |
Gruenfrosch | 0:7627c79db971 | 237 | # endif /* OPT_ACCURACY */ |
Gruenfrosch | 0:7627c79db971 | 238 | |
Gruenfrosch | 0:7627c79db971 | 239 | # define MAD_F_SCALEBITS MAD_F_FRACBITS |
Gruenfrosch | 0:7627c79db971 | 240 | # endif |
Gruenfrosch | 0:7627c79db971 | 241 | |
Gruenfrosch | 0:7627c79db971 | 242 | /* --- ARM ----------------------------------------------------------------- */ |
Gruenfrosch | 0:7627c79db971 | 243 | |
Gruenfrosch | 0:7627c79db971 | 244 | # elif defined(FPM_ARM) |
Gruenfrosch | 0:7627c79db971 | 245 | |
Gruenfrosch | 0:7627c79db971 | 246 | /* |
Gruenfrosch | 0:7627c79db971 | 247 | * This ARM V4 version is as accurate as FPM_64BIT but much faster. The |
Gruenfrosch | 0:7627c79db971 | 248 | * least significant bit is properly rounded at no CPU cycle cost! |
Gruenfrosch | 0:7627c79db971 | 249 | */ |
Gruenfrosch | 0:7627c79db971 | 250 | # if 1 |
Gruenfrosch | 0:7627c79db971 | 251 | /* |
Gruenfrosch | 0:7627c79db971 | 252 | * This is faster than the default implementation via MAD_F_MLX() and |
Gruenfrosch | 0:7627c79db971 | 253 | * mad_f_scale64(). |
Gruenfrosch | 0:7627c79db971 | 254 | */ |
Gruenfrosch | 0:7627c79db971 | 255 | # define mad_f_mul(x, y) \ |
Gruenfrosch | 0:7627c79db971 | 256 | ({ mad_fixed64hi_t __hi; \ |
Gruenfrosch | 0:7627c79db971 | 257 | mad_fixed64lo_t __lo; \ |
Gruenfrosch | 0:7627c79db971 | 258 | mad_fixed_t __result; \ |
Gruenfrosch | 0:7627c79db971 | 259 | asm ("smull %0, %1, %3, %4\n\t" \ |
Gruenfrosch | 0:7627c79db971 | 260 | "movs %0, %0, lsr %5\n\t" \ |
Gruenfrosch | 0:7627c79db971 | 261 | "adc %2, %0, %1, lsl %6" \ |
Gruenfrosch | 0:7627c79db971 | 262 | : "=&r" (__lo), "=&r" (__hi), "=r" (__result) \ |
Gruenfrosch | 0:7627c79db971 | 263 | : "%r" (x), "r" (y), \ |
Gruenfrosch | 0:7627c79db971 | 264 | "M" (MAD_F_SCALEBITS), "M" (32 - MAD_F_SCALEBITS) \ |
Gruenfrosch | 0:7627c79db971 | 265 | : "cc"); \ |
Gruenfrosch | 0:7627c79db971 | 266 | __result; \ |
Gruenfrosch | 0:7627c79db971 | 267 | }) |
Gruenfrosch | 0:7627c79db971 | 268 | # endif |
Gruenfrosch | 0:7627c79db971 | 269 | |
Gruenfrosch | 0:7627c79db971 | 270 | # define MAD_F_MLX(hi, lo, x, y) \ |
Gruenfrosch | 0:7627c79db971 | 271 | asm ("smull %0, %1, %2, %3" \ |
Gruenfrosch | 0:7627c79db971 | 272 | : "=&r" (lo), "=&r" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 273 | : "%r" (x), "r" (y)) |
Gruenfrosch | 0:7627c79db971 | 274 | |
Gruenfrosch | 0:7627c79db971 | 275 | # define MAD_F_MLA(hi, lo, x, y) \ |
Gruenfrosch | 0:7627c79db971 | 276 | asm ("smlal %0, %1, %2, %3" \ |
Gruenfrosch | 0:7627c79db971 | 277 | : "+r" (lo), "+r" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 278 | : "%r" (x), "r" (y)) |
Gruenfrosch | 0:7627c79db971 | 279 | |
Gruenfrosch | 0:7627c79db971 | 280 | # define MAD_F_MLN(hi, lo) \ |
Gruenfrosch | 0:7627c79db971 | 281 | asm ("rsbs %0, %2, #0\n\t" \ |
Gruenfrosch | 0:7627c79db971 | 282 | "rsc %1, %3, #0" \ |
Gruenfrosch | 0:7627c79db971 | 283 | : "=r" (lo), "=r" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 284 | : "0" (lo), "1" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 285 | : "cc") |
Gruenfrosch | 0:7627c79db971 | 286 | |
Gruenfrosch | 0:7627c79db971 | 287 | # define mad_f_scale64(hi, lo) \ |
Gruenfrosch | 0:7627c79db971 | 288 | ({ mad_fixed_t __result; \ |
Gruenfrosch | 0:7627c79db971 | 289 | asm ("movs %0, %1, lsr %3\n\t" \ |
Gruenfrosch | 0:7627c79db971 | 290 | "adc %0, %0, %2, lsl %4" \ |
Gruenfrosch | 0:7627c79db971 | 291 | : "=&r" (__result) \ |
Gruenfrosch | 0:7627c79db971 | 292 | : "r" (lo), "r" (hi), \ |
Gruenfrosch | 0:7627c79db971 | 293 | "M" (MAD_F_SCALEBITS), "M" (32 - MAD_F_SCALEBITS) \ |
Gruenfrosch | 0:7627c79db971 | 294 | : "cc"); \ |
Gruenfrosch | 0:7627c79db971 | 295 | __result; \ |
Gruenfrosch | 0:7627c79db971 | 296 | }) |
Gruenfrosch | 0:7627c79db971 | 297 | |
Gruenfrosch | 0:7627c79db971 | 298 | # define MAD_F_SCALEBITS MAD_F_FRACBITS |
Gruenfrosch | 0:7627c79db971 | 299 | |
Gruenfrosch | 0:7627c79db971 | 300 | /* --- MIPS ---------------------------------------------------------------- */ |
Gruenfrosch | 0:7627c79db971 | 301 | |
Gruenfrosch | 0:7627c79db971 | 302 | # elif defined(FPM_MIPS) |
Gruenfrosch | 0:7627c79db971 | 303 | |
Gruenfrosch | 0:7627c79db971 | 304 | /* |
Gruenfrosch | 0:7627c79db971 | 305 | * This MIPS version is fast and accurate; the disposition of the least |
Gruenfrosch | 0:7627c79db971 | 306 | * significant bit depends on OPT_ACCURACY via mad_f_scale64(). |
Gruenfrosch | 0:7627c79db971 | 307 | */ |
Gruenfrosch | 0:7627c79db971 | 308 | # define MAD_F_MLX(hi, lo, x, y) \ |
Gruenfrosch | 0:7627c79db971 | 309 | asm ("mult %2,%3" \ |
Gruenfrosch | 0:7627c79db971 | 310 | : "=l" (lo), "=h" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 311 | : "%r" (x), "r" (y)) |
Gruenfrosch | 0:7627c79db971 | 312 | |
Gruenfrosch | 0:7627c79db971 | 313 | # if defined(HAVE_MADD_ASM) |
Gruenfrosch | 0:7627c79db971 | 314 | # define MAD_F_MLA(hi, lo, x, y) \ |
Gruenfrosch | 0:7627c79db971 | 315 | asm ("madd %2,%3" \ |
Gruenfrosch | 0:7627c79db971 | 316 | : "+l" (lo), "+h" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 317 | : "%r" (x), "r" (y)) |
Gruenfrosch | 0:7627c79db971 | 318 | # elif defined(HAVE_MADD16_ASM) |
Gruenfrosch | 0:7627c79db971 | 319 | /* |
Gruenfrosch | 0:7627c79db971 | 320 | * This loses significant accuracy due to the 16-bit integer limit in the |
Gruenfrosch | 0:7627c79db971 | 321 | * multiply/accumulate instruction. |
Gruenfrosch | 0:7627c79db971 | 322 | */ |
Gruenfrosch | 0:7627c79db971 | 323 | # define MAD_F_ML0(hi, lo, x, y) \ |
Gruenfrosch | 0:7627c79db971 | 324 | asm ("mult %2,%3" \ |
Gruenfrosch | 0:7627c79db971 | 325 | : "=l" (lo), "=h" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 326 | : "%r" ((x) >> 12), "r" ((y) >> 16)) |
Gruenfrosch | 0:7627c79db971 | 327 | # define MAD_F_MLA(hi, lo, x, y) \ |
Gruenfrosch | 0:7627c79db971 | 328 | asm ("madd16 %2,%3" \ |
Gruenfrosch | 0:7627c79db971 | 329 | : "+l" (lo), "+h" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 330 | : "%r" ((x) >> 12), "r" ((y) >> 16)) |
Gruenfrosch | 0:7627c79db971 | 331 | # define MAD_F_MLZ(hi, lo) ((mad_fixed_t) (lo)) |
Gruenfrosch | 0:7627c79db971 | 332 | # endif |
Gruenfrosch | 0:7627c79db971 | 333 | |
Gruenfrosch | 0:7627c79db971 | 334 | # if defined(OPT_SPEED) |
Gruenfrosch | 0:7627c79db971 | 335 | # define mad_f_scale64(hi, lo) \ |
Gruenfrosch | 0:7627c79db971 | 336 | ((mad_fixed_t) ((hi) << (32 - MAD_F_SCALEBITS))) |
Gruenfrosch | 0:7627c79db971 | 337 | # define MAD_F_SCALEBITS MAD_F_FRACBITS |
Gruenfrosch | 0:7627c79db971 | 338 | # endif |
Gruenfrosch | 0:7627c79db971 | 339 | |
Gruenfrosch | 0:7627c79db971 | 340 | /* --- SPARC --------------------------------------------------------------- */ |
Gruenfrosch | 0:7627c79db971 | 341 | |
Gruenfrosch | 0:7627c79db971 | 342 | # elif defined(FPM_SPARC) |
Gruenfrosch | 0:7627c79db971 | 343 | |
Gruenfrosch | 0:7627c79db971 | 344 | /* |
Gruenfrosch | 0:7627c79db971 | 345 | * This SPARC V8 version is fast and accurate; the disposition of the least |
Gruenfrosch | 0:7627c79db971 | 346 | * significant bit depends on OPT_ACCURACY via mad_f_scale64(). |
Gruenfrosch | 0:7627c79db971 | 347 | */ |
Gruenfrosch | 0:7627c79db971 | 348 | # define MAD_F_MLX(hi, lo, x, y) \ |
Gruenfrosch | 0:7627c79db971 | 349 | asm ("smul %2, %3, %0\n\t" \ |
Gruenfrosch | 0:7627c79db971 | 350 | "rd %%y, %1" \ |
Gruenfrosch | 0:7627c79db971 | 351 | : "=r" (lo), "=r" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 352 | : "%r" (x), "rI" (y)) |
Gruenfrosch | 0:7627c79db971 | 353 | |
Gruenfrosch | 0:7627c79db971 | 354 | /* --- PowerPC ------------------------------------------------------------- */ |
Gruenfrosch | 0:7627c79db971 | 355 | |
Gruenfrosch | 0:7627c79db971 | 356 | # elif defined(FPM_PPC) |
Gruenfrosch | 0:7627c79db971 | 357 | |
Gruenfrosch | 0:7627c79db971 | 358 | /* |
Gruenfrosch | 0:7627c79db971 | 359 | * This PowerPC version is fast and accurate; the disposition of the least |
Gruenfrosch | 0:7627c79db971 | 360 | * significant bit depends on OPT_ACCURACY via mad_f_scale64(). |
Gruenfrosch | 0:7627c79db971 | 361 | */ |
Gruenfrosch | 0:7627c79db971 | 362 | # define MAD_F_MLX(hi, lo, x, y) \ |
Gruenfrosch | 0:7627c79db971 | 363 | do { \ |
Gruenfrosch | 0:7627c79db971 | 364 | asm ("mullw %0,%1,%2" \ |
Gruenfrosch | 0:7627c79db971 | 365 | : "=r" (lo) \ |
Gruenfrosch | 0:7627c79db971 | 366 | : "%r" (x), "r" (y)); \ |
Gruenfrosch | 0:7627c79db971 | 367 | asm ("mulhw %0,%1,%2" \ |
Gruenfrosch | 0:7627c79db971 | 368 | : "=r" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 369 | : "%r" (x), "r" (y)); \ |
Gruenfrosch | 0:7627c79db971 | 370 | } \ |
Gruenfrosch | 0:7627c79db971 | 371 | while (0) |
Gruenfrosch | 0:7627c79db971 | 372 | |
Gruenfrosch | 0:7627c79db971 | 373 | # if defined(OPT_ACCURACY) |
Gruenfrosch | 0:7627c79db971 | 374 | /* |
Gruenfrosch | 0:7627c79db971 | 375 | * This gives best accuracy but is not very fast. |
Gruenfrosch | 0:7627c79db971 | 376 | */ |
Gruenfrosch | 0:7627c79db971 | 377 | # define MAD_F_MLA(hi, lo, x, y) \ |
Gruenfrosch | 0:7627c79db971 | 378 | ({ mad_fixed64hi_t __hi; \ |
Gruenfrosch | 0:7627c79db971 | 379 | mad_fixed64lo_t __lo; \ |
Gruenfrosch | 0:7627c79db971 | 380 | MAD_F_MLX(__hi, __lo, (x), (y)); \ |
Gruenfrosch | 0:7627c79db971 | 381 | asm ("addc %0,%2,%3\n\t" \ |
Gruenfrosch | 0:7627c79db971 | 382 | "adde %1,%4,%5" \ |
Gruenfrosch | 0:7627c79db971 | 383 | : "=r" (lo), "=r" (hi) \ |
Gruenfrosch | 0:7627c79db971 | 384 | : "%r" (lo), "r" (__lo), \ |
Gruenfrosch | 0:7627c79db971 | 385 | "%r" (hi), "r" (__hi) \ |
Gruenfrosch | 0:7627c79db971 | 386 | : "xer"); \ |
Gruenfrosch | 0:7627c79db971 | 387 | }) |
Gruenfrosch | 0:7627c79db971 | 388 | # endif |
Gruenfrosch | 0:7627c79db971 | 389 | |
Gruenfrosch | 0:7627c79db971 | 390 | # if defined(OPT_ACCURACY) |
Gruenfrosch | 0:7627c79db971 | 391 | /* |
Gruenfrosch | 0:7627c79db971 | 392 | * This is slower than the truncating version below it. |
Gruenfrosch | 0:7627c79db971 | 393 | */ |
Gruenfrosch | 0:7627c79db971 | 394 | # define mad_f_scale64(hi, lo) \ |
Gruenfrosch | 0:7627c79db971 | 395 | ({ mad_fixed_t __result, __round; \ |
Gruenfrosch | 0:7627c79db971 | 396 | asm ("rotrwi %0,%1,%2" \ |
Gruenfrosch | 0:7627c79db971 | 397 | : "=r" (__result) \ |
Gruenfrosch | 0:7627c79db971 | 398 | : "r" (lo), "i" (MAD_F_SCALEBITS)); \ |
Gruenfrosch | 0:7627c79db971 | 399 | asm ("extrwi %0,%1,1,0" \ |
Gruenfrosch | 0:7627c79db971 | 400 | : "=r" (__round) \ |
Gruenfrosch | 0:7627c79db971 | 401 | : "r" (__result)); \ |
Gruenfrosch | 0:7627c79db971 | 402 | asm ("insrwi %0,%1,%2,0" \ |
Gruenfrosch | 0:7627c79db971 | 403 | : "+r" (__result) \ |
Gruenfrosch | 0:7627c79db971 | 404 | : "r" (hi), "i" (MAD_F_SCALEBITS)); \ |
Gruenfrosch | 0:7627c79db971 | 405 | asm ("add %0,%1,%2" \ |
Gruenfrosch | 0:7627c79db971 | 406 | : "=r" (__result) \ |
Gruenfrosch | 0:7627c79db971 | 407 | : "%r" (__result), "r" (__round)); \ |
Gruenfrosch | 0:7627c79db971 | 408 | __result; \ |
Gruenfrosch | 0:7627c79db971 | 409 | }) |
Gruenfrosch | 0:7627c79db971 | 410 | # else |
Gruenfrosch | 0:7627c79db971 | 411 | # define mad_f_scale64(hi, lo) \ |
Gruenfrosch | 0:7627c79db971 | 412 | ({ mad_fixed_t __result; \ |
Gruenfrosch | 0:7627c79db971 | 413 | asm ("rotrwi %0,%1,%2" \ |
Gruenfrosch | 0:7627c79db971 | 414 | : "=r" (__result) \ |
Gruenfrosch | 0:7627c79db971 | 415 | : "r" (lo), "i" (MAD_F_SCALEBITS)); \ |
Gruenfrosch | 0:7627c79db971 | 416 | asm ("insrwi %0,%1,%2,0" \ |
Gruenfrosch | 0:7627c79db971 | 417 | : "+r" (__result) \ |
Gruenfrosch | 0:7627c79db971 | 418 | : "r" (hi), "i" (MAD_F_SCALEBITS)); \ |
Gruenfrosch | 0:7627c79db971 | 419 | __result; \ |
Gruenfrosch | 0:7627c79db971 | 420 | }) |
Gruenfrosch | 0:7627c79db971 | 421 | # endif |
Gruenfrosch | 0:7627c79db971 | 422 | |
Gruenfrosch | 0:7627c79db971 | 423 | # define MAD_F_SCALEBITS MAD_F_FRACBITS |
Gruenfrosch | 0:7627c79db971 | 424 | |
Gruenfrosch | 0:7627c79db971 | 425 | /* --- Default ------------------------------------------------------------- */ |
Gruenfrosch | 0:7627c79db971 | 426 | |
Gruenfrosch | 0:7627c79db971 | 427 | # elif defined(FPM_DEFAULT) |
Gruenfrosch | 0:7627c79db971 | 428 | |
Gruenfrosch | 0:7627c79db971 | 429 | /* |
Gruenfrosch | 0:7627c79db971 | 430 | * This version is the most portable but it loses significant accuracy. |
Gruenfrosch | 0:7627c79db971 | 431 | * Furthermore, accuracy is biased against the second argument, so care |
Gruenfrosch | 0:7627c79db971 | 432 | * should be taken when ordering operands. |
Gruenfrosch | 0:7627c79db971 | 433 | * |
Gruenfrosch | 0:7627c79db971 | 434 | * The scale factors are constant as this is not used with SSO. |
Gruenfrosch | 0:7627c79db971 | 435 | * |
Gruenfrosch | 0:7627c79db971 | 436 | * Pre-rounding is required to stay within the limits of compliance. |
Gruenfrosch | 0:7627c79db971 | 437 | */ |
Gruenfrosch | 0:7627c79db971 | 438 | # if defined(OPT_SPEED) |
Gruenfrosch | 0:7627c79db971 | 439 | # define mad_f_mul(x, y) (((x) >> 12) * ((y) >> 16)) |
Gruenfrosch | 0:7627c79db971 | 440 | # else |
Gruenfrosch | 0:7627c79db971 | 441 | # define mad_f_mul(x, y) ((((x) + (1L << 11)) >> 12) * \ |
Gruenfrosch | 0:7627c79db971 | 442 | (((y) + (1L << 15)) >> 16)) |
Gruenfrosch | 0:7627c79db971 | 443 | # endif |
Gruenfrosch | 0:7627c79db971 | 444 | |
Gruenfrosch | 0:7627c79db971 | 445 | /* ------------------------------------------------------------------------- */ |
Gruenfrosch | 0:7627c79db971 | 446 | |
Gruenfrosch | 0:7627c79db971 | 447 | # else |
Gruenfrosch | 0:7627c79db971 | 448 | # error "no FPM selected" |
Gruenfrosch | 0:7627c79db971 | 449 | # endif |
Gruenfrosch | 0:7627c79db971 | 450 | |
Gruenfrosch | 0:7627c79db971 | 451 | /* default implementations */ |
Gruenfrosch | 0:7627c79db971 | 452 | /* Generic mad_f_mul(), used when the selected FPM section did not define one: form the two-word product with MAD_F_MLX() and reduce it with mad_f_scale64(). Written as a GNU statement expression, so the value of the last statement is the result. */ |
Gruenfrosch | 0:7627c79db971 | 453 | # if !defined(mad_f_mul) |
Gruenfrosch | 0:7627c79db971 | 454 | # define mad_f_mul(x, y) \ |
Gruenfrosch | 0:7627c79db971 | 455 | ({ register mad_fixed64hi_t __hi; \ |
Gruenfrosch | 0:7627c79db971 | 456 | register mad_fixed64lo_t __lo; \ |
Gruenfrosch | 0:7627c79db971 | 457 | MAD_F_MLX(__hi, __lo, (x), (y)); \ |
Gruenfrosch | 0:7627c79db971 | 458 | mad_f_scale64(__hi, __lo); \ |
Gruenfrosch | 0:7627c79db971 | 459 | }) |
Gruenfrosch | 0:7627c79db971 | 460 | # endif |
Gruenfrosch | 0:7627c79db971 | 461 | /* Fallback when no multiply-accumulate macro was provided: each product is already scaled by mad_f_mul() and is summed in lo alone. hi is not used for arithmetic here, and MAD_F_MLZ simply yields lo (evaluating hi only to discard it). */ |
Gruenfrosch | 0:7627c79db971 | 462 | # if !defined(MAD_F_MLA) |
Gruenfrosch | 0:7627c79db971 | 463 | # define MAD_F_ML0(hi, lo, x, y) ((lo) = mad_f_mul((x), (y))) |
Gruenfrosch | 0:7627c79db971 | 464 | # define MAD_F_MLA(hi, lo, x, y) ((lo) += mad_f_mul((x), (y))) |
Gruenfrosch | 0:7627c79db971 | 465 | # define MAD_F_MLN(hi, lo) ((lo) = -(lo)) |
Gruenfrosch | 0:7627c79db971 | 466 | # define MAD_F_MLZ(hi, lo) ((void) (hi), (mad_fixed_t) (lo)) |
Gruenfrosch | 0:7627c79db971 | 467 | # endif |
Gruenfrosch | 0:7627c79db971 | 468 | |
Gruenfrosch | 0:7627c79db971 | 469 | # if !defined(MAD_F_ML0) |
Gruenfrosch | 0:7627c79db971 | 470 | # define MAD_F_ML0(hi, lo, x, y) MAD_F_MLX((hi), (lo), (x), (y)) |
Gruenfrosch | 0:7627c79db971 | 471 | # endif |
Gruenfrosch | 0:7627c79db971 | 472 | /* Negate the two-word value held in (hi, lo): lo is negated first; if the new lo is non-zero hi becomes ~hi, otherwise (lo was zero, so the +1 carries into the high word) hi becomes -hi. */ |
Gruenfrosch | 0:7627c79db971 | 473 | # if !defined(MAD_F_MLN) |
Gruenfrosch | 0:7627c79db971 | 474 | # define MAD_F_MLN(hi, lo) ((hi) = ((lo) = -(lo)) ? ~(hi) : -(hi)) |
Gruenfrosch | 0:7627c79db971 | 475 | # endif |
Gruenfrosch | 0:7627c79db971 | 476 | |
Gruenfrosch | 0:7627c79db971 | 477 | # if !defined(MAD_F_MLZ) |
Gruenfrosch | 0:7627c79db971 | 478 | # define MAD_F_MLZ(hi, lo) mad_f_scale64((hi), (lo)) |
Gruenfrosch | 0:7627c79db971 | 479 | # endif |
Gruenfrosch | 0:7627c79db971 | 480 | /* Portable fallback scaling: rebuild a single-word result from the (hi, lo) pair by OR-ing hi shifted left with lo shifted right by MAD_F_SCALEBITS. With OPT_ACCURACY the shift is one bit shorter, then 1 is added and the extra bit shifted out, which rounds instead of truncating. */ |
Gruenfrosch | 0:7627c79db971 | 481 | # if !defined(mad_f_scale64) |
Gruenfrosch | 0:7627c79db971 | 482 | # if defined(OPT_ACCURACY) |
Gruenfrosch | 0:7627c79db971 | 483 | # define mad_f_scale64(hi, lo) \ |
Gruenfrosch | 0:7627c79db971 | 484 | ((((mad_fixed_t) \ |
Gruenfrosch | 0:7627c79db971 | 485 | (((hi) << (32 - (MAD_F_SCALEBITS - 1))) | \ |
Gruenfrosch | 0:7627c79db971 | 486 | ((lo) >> (MAD_F_SCALEBITS - 1)))) + 1) >> 1) |
Gruenfrosch | 0:7627c79db971 | 487 | # else |
Gruenfrosch | 0:7627c79db971 | 488 | # define mad_f_scale64(hi, lo) \ |
Gruenfrosch | 0:7627c79db971 | 489 | ((mad_fixed_t) \ |
Gruenfrosch | 0:7627c79db971 | 490 | (((hi) << (32 - MAD_F_SCALEBITS)) | \ |
Gruenfrosch | 0:7627c79db971 | 491 | ((lo) >> MAD_F_SCALEBITS))) |
Gruenfrosch | 0:7627c79db971 | 492 | # endif |
Gruenfrosch | 0:7627c79db971 | 493 | # define MAD_F_SCALEBITS MAD_F_FRACBITS |
Gruenfrosch | 0:7627c79db971 | 494 | # endif |
Gruenfrosch | 0:7627c79db971 | 495 | |
Gruenfrosch | 0:7627c79db971 | 496 | /* C routines */ |
Gruenfrosch | 0:7627c79db971 | 497 | |
Gruenfrosch | 0:7627c79db971 | 498 | mad_fixed_t mad_f_abs(mad_fixed_t); |
Gruenfrosch | 0:7627c79db971 | 499 | mad_fixed_t mad_f_div(mad_fixed_t, mad_fixed_t); |
Gruenfrosch | 0:7627c79db971 | 500 | |
Gruenfrosch | 0:7627c79db971 | 501 | # endif |