1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145
|
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
<title>intrinsic_exponential.hpp Source File</title>
<link href="tabs.css" rel="stylesheet" type="text/css"/>
<link href="doxygen.css" rel="stylesheet" type="text/css" />
</head>
<body>
<div id="top"><!-- do not remove this div! -->
<div id="titlearea">
<table cellspacing="0" cellpadding="0">
<tbody>
<tr style="height: 56px;">
<td id="projectlogo"><img alt="Logo" src="logo-mini.png"/></td>
</tr>
</tbody>
</table>
</div>
<!-- Generated by Doxygen 1.8.0 -->
<div id="navrow1" class="tabs">
<ul class="tablist">
<li><a href="index.html"><span>Main Page</span></a></li>
<li><a href="pages.html"><span>Related Pages</span></a></li>
<li><a href="modules.html"><span>Modules</span></a></li>
<li><a href="annotated.html"><span>Classes</span></a></li>
<li class="current"><a href="files.html"><span>Files</span></a></li>
</ul>
</div>
<div id="navrow2" class="tabs2">
<ul class="tablist">
<li><a href="files.html"><span>File List</span></a></li>
</ul>
</div>
</div>
<div class="header">
<div class="headertitle">
<div class="title">intrinsic_exponential.hpp</div> </div>
</div><!--header-->
<div class="contents">
<a href="a00045.html">Go to the documentation of this file.</a><div class="fragment"><pre class="fragment"><a name="l00001"></a>00001
<a name="l00002"></a>00002
<a name="l00003"></a>00003
<a name="l00004"></a>00004
<a name="l00005"></a>00005
<a name="l00006"></a>00006
<a name="l00007"></a>00007
<a name="l00008"></a>00008
<a name="l00009"></a>00009
<a name="l00010"></a>00010
<a name="l00011"></a>00011
<a name="l00012"></a>00012
<a name="l00013"></a>00013
<a name="l00014"></a>00014
<a name="l00015"></a>00015
<a name="l00016"></a>00016
<a name="l00017"></a>00017
<a name="l00018"></a>00018
<a name="l00019"></a>00019
<a name="l00020"></a>00020
<a name="l00021"></a>00021
<a name="l00022"></a>00022
<a name="l00023"></a>00023
<a name="l00024"></a>00024
<a name="l00025"></a>00025
<a name="l00026"></a>00026
<a name="l00027"></a>00027
<a name="l00028"></a>00028
<a name="l00029"></a>00029 <span class="preprocessor">#ifndef glm_detail_intrinsic_exponential</span>
<a name="l00030"></a>00030 <span class="preprocessor"></span><span class="preprocessor">#define glm_detail_intrinsic_exponential</span>
<a name="l00031"></a>00031 <span class="preprocessor"></span>
<a name="l00032"></a>00032 <span class="preprocessor">#include "<a class="code" href="a00083.html" title="OpenGL Mathematics (glm.g-truc.net)">setup.hpp</a>"</span>
<a name="l00033"></a>00033
<a name="l00034"></a>00034 <span class="preprocessor">#if((GLM_ARCH & GLM_ARCH_SSE2) != GLM_ARCH_SSE2)</span>
<a name="l00035"></a>00035 <span class="preprocessor"></span><span class="preprocessor"># error "SSE2 instructions not supported or enabled"</span>
<a name="l00036"></a>00036 <span class="preprocessor"></span><span class="preprocessor">#else</span>
<a name="l00037"></a>00037 <span class="preprocessor"></span>
<a name="l00038"></a>00038 <span class="keyword">namespace </span>glm{
<a name="l00039"></a>00039 <span class="keyword">namespace </span>detail
<a name="l00040"></a>00040 {
<a name="l00041"></a>00041 <span class="comment">/*</span>
<a name="l00042"></a>00042 <span class="comment">GLM_FUNC_QUALIFIER __m128 sse_rsqrt_nr_ss(__m128 const x)</span>
<a name="l00043"></a>00043 <span class="comment">{</span>
<a name="l00044"></a>00044 <span class="comment"> __m128 recip = _mm_rsqrt_ss( x ); // "estimate" opcode</span>
<a name="l00045"></a>00045 <span class="comment"> const static __m128 three = { 3, 3, 3, 3 }; // aligned consts for fast load</span>
<a name="l00046"></a>00046 <span class="comment"> const static __m128 half = { 0.5,0.5,0.5,0.5 };</span>
<a name="l00047"></a>00047 <span class="comment"> __m128 halfrecip = _mm_mul_ss( half, recip );</span>
<a name="l00048"></a>00048 <span class="comment"> __m128 threeminus_xrr = _mm_sub_ss( three, _mm_mul_ss( x, _mm_mul_ss ( recip, recip ) ) );</span>
<a name="l00049"></a>00049 <span class="comment"> return _mm_mul_ss( halfrecip, threeminus_xrr );</span>
<a name="l00050"></a>00050 <span class="comment">}</span>
<a name="l00051"></a>00051 <span class="comment"> </span>
<a name="l00052"></a>00052 <span class="comment">GLM_FUNC_QUALIFIER __m128 sse_normalize_fast_ps( float * RESTRICT vOut, float * RESTRICT vIn )</span>
<a name="l00053"></a>00053 <span class="comment">{</span>
<a name="l00054"></a>00054 <span class="comment"> __m128 x = _mm_load_ss(&vIn[0]);</span>
<a name="l00055"></a>00055 <span class="comment"> __m128 y = _mm_load_ss(&vIn[1]);</span>
<a name="l00056"></a>00056 <span class="comment"> __m128 z = _mm_load_ss(&vIn[2]);</span>
<a name="l00057"></a>00057 <span class="comment"> </span>
<a name="l00058"></a>00058 <span class="comment"> const __m128 l = // compute x*x + y*y + z*z</span>
<a name="l00059"></a>00059 <span class="comment"> _mm_add_ss(</span>
<a name="l00060"></a>00060 <span class="comment"> _mm_add_ss( _mm_mul_ss(x,x),</span>
<a name="l00061"></a>00061 <span class="comment"> _mm_mul_ss(y,y)</span>
<a name="l00062"></a>00062 <span class="comment"> ),</span>
<a name="l00063"></a>00063 <span class="comment"> _mm_mul_ss( z, z )</span>
<a name="l00064"></a>00064 <span class="comment"> );</span>
<a name="l00065"></a>00065 <span class="comment"> </span>
<a name="l00066"></a>00066 <span class="comment"> </span>
<a name="l00067"></a>00067 <span class="comment"> const __m128 rsqt = _mm_rsqrt_nr_ss( l );</span>
<a name="l00068"></a>00068 <span class="comment"> _mm_store_ss( &vOut[0] , _mm_mul_ss( rsqt, x ) );</span>
<a name="l00069"></a>00069 <span class="comment"> _mm_store_ss( &vOut[1] , _mm_mul_ss( rsqt, y ) );</span>
<a name="l00070"></a>00070 <span class="comment"> _mm_store_ss( &vOut[2] , _mm_mul_ss( rsqt, z ) );</span>
<a name="l00071"></a>00071 <span class="comment"> </span>
<a name="l00072"></a>00072 <span class="comment"> return _mm_mul_ss( l , rsqt );</span>
<a name="l00073"></a>00073 <span class="comment">}</span>
<a name="l00074"></a>00074 <span class="comment">*/</span>
<a name="l00075"></a>00075 }<span class="comment">//namespace detail</span>
<a name="l00076"></a>00076 }<span class="comment">//namespace glm</span>
<a name="l00077"></a>00077
<a name="l00078"></a>00078 <span class="preprocessor">#endif//GLM_ARCH</span>
<a name="l00079"></a>00079 <span class="preprocessor"></span><span class="preprocessor">#endif//glm_detail_intrinsic_exponential</span>
</pre></div></div><!-- contents -->
<hr class="footer"/><address class="footer"><small>
Generated by  <a href="http://www.doxygen.org/index.html">
<img class="footer" src="doxygen.png" alt="doxygen"/>
</a> 1.8.0
</small></address>
</body>
</html>
|